Train size: 80 Test size: 20
	Tokenizer: allenai/longformer-base-4096 Model: allenai/longformer-base-4096


		-------------RUN 1-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.7269338303821062, 'contradicts': 0.09090909090909091, 'parts_of_same': 0.0}, 'recall': {'supports': 0.9873417721518988, 'contradicts': 0.008333333333333333, 'parts_of_same': 0.0}, 'f1': {'supports': 0.8373590982286634, 'contradicts': 0.015267175572519083, 'parts_of_same': 0.0}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.7204797047970479, 'recall': 0.7204797047970479, 'f1': 0.7204797047970478, 'support': None}, 'macro_avg': {'precision': 0.27261430709706574, 'recall': 0.3318917018284107, 'f1': 0.2842087579337275, 'support': None}, 'weighted_avg': {'precision': 0.5398402370027259, 'recall': 0.7204797047970479, 'f1': 0.6119425725731977, 'support': None}}
Loss: tensor(0.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9657534246575342, 'contradicts': 0.4166666666666667, 'parts_of_same': 0.5653846153846154}, 'recall': {'supports': 0.7139240506329114, 'contradicts': 0.8333333333333334, 'parts_of_same': 0.8448275862068966}, 'f1': {'supports': 0.8209606986899564, 'contradicts': 0.5555555555555556, 'parts_of_same': 0.6774193548387097}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.7481549815498155, 'recall': 0.7481549815498155, 'f1': 0.7481549815498154, 'support': None}, 'macro_avg': {'precision': 0.6492682355696054, 'recall': 0.7973616567243805, 'f1': 0.6846452030280737, 'support': None}, 'weighted_avg': {'precision': 0.8407030706239623, 'recall': 0.7481549815498155, 'f1': 0.7685392863225716, 'support': None}}
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9418777943368107, 'contradicts': 0.5838926174496645, 'parts_of_same': 0.5568181818181818}, 'recall': {'supports': 0.8, 'contradicts': 0.725, 'parts_of_same': 0.8448275862068966}, 'f1': {'supports': 0.8651608487337441, 'contradicts': 0.6468401486988847, 'parts_of_same': 0.6712328767123287}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.7988929889298892, 'recall': 0.7988929889298892, 'f1': 0.7988929889298891, 'support': None}, 'macro_avg': {'precision': 0.694196197868219, 'recall': 0.7899425287356321, 'f1': 0.7277446247149859, 'support': None}, 'weighted_avg': {'precision': 0.8404399771738043, 'recall': 0.7988929889298892, 'f1': 0.8098638458408387, 'support': None}}
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9140625, 'contradicts': 0.5737704918032787, 'parts_of_same': 0.6855670103092784}, 'recall': {'supports': 0.8886075949367088, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.764367816091954}, 'f1': {'supports': 0.9011553273427472, 'contradicts': 0.5785123966942148, 'parts_of_same': 0.7228260869565217}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.834870848708487, 'recall': 0.834870848708487, 'f1': 0.834870848708487, 'support': None}, 'macro_avg': {'precision': 0.7244666673708524, 'recall': 0.7454362481206654, 'f1': 0.7341646036644945, 'support': None}, 'weighted_avg': {'precision': 0.8397144776846936, 'recall': 0.834870848708487, 'f1': 0.8368135934820211, 'support': None}}
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.9290586630286494, 'contradicts': 0.5116279069767442, 'parts_of_same': 0.7597765363128491}, 'recall': {'supports': 0.8620253164556962, 'contradicts': 0.7333333333333333, 'parts_of_same': 0.7816091954022989}, 'f1': {'supports': 0.8942875902823375, 'contradicts': 0.6027397260273971, 'parts_of_same': 0.7705382436260623}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.834870848708487, 'recall': 0.834870848708487, 'f1': 0.834870848708487, 'support': None}, 'macro_avg': {'precision': 0.7334877021060809, 'recall': 0.7923226150637762, 'f1': 0.7558551866452655, 'support': None}, 'weighted_avg': {'precision': 0.855676023937526, 'recall': 0.834870848708487, 'f1': 0.8421490939458203, 'support': None}}
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.9173027989821882, 'contradicts': 0.6357142857142857, 'parts_of_same': 0.7848101265822784}, 'recall': {'supports': 0.9126582278481012, 'contradicts': 0.7416666666666667, 'parts_of_same': 0.7126436781609196}, 'f1': {'supports': 0.9149746192893401, 'contradicts': 0.6846153846153846, 'parts_of_same': 0.746987951807229}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8616236162361623, 'recall': 0.8616236162361623, 'f1': 0.8616236162361623, 'support': None}, 'macro_avg': {'precision': 0.7792757370929175, 'recall': 0.788989524225229, 'f1': 0.7821926519039845, 'support': None}, 'weighted_avg': {'precision': 0.8648633648588187, 'recall': 0.8616236162361623, 'f1': 0.8625089474233235, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9437229437229437, 'contradicts': 0.4873096446700508, 'parts_of_same': 0.711340206185567}, 'recall': {'supports': 0.8278481012658228, 'contradicts': 0.8, 'parts_of_same': 0.7931034482758621}, 'f1': {'supports': 0.8819959541469993, 'contradicts': 0.6056782334384859, 'parts_of_same': 0.75}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8191881918819188, 'recall': 0.8191881918819188, 'f1': 0.8191881918819188, 'support': None}, 'macro_avg': {'precision': 0.7141242648595205, 'recall': 0.8069838498472283, 'f1': 0.7458913958618284, 'support': None}, 'weighted_avg': {'precision': 0.8558961981345206, 'recall': 0.8191881918819188, 'f1': 0.830219734122461, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9228758169934641, 'contradicts': 0.6434782608695652, 'parts_of_same': 0.6813725490196079}, 'recall': {'supports': 0.8936708860759494, 'contradicts': 0.6166666666666667, 'parts_of_same': 0.7988505747126436}, 'f1': {'supports': 0.9080385852090032, 'contradicts': 0.6297872340425532, 'parts_of_same': 0.7354497354497354}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8477859778597786, 'recall': 0.8477859778597786, 'f1': 0.8477859778597786, 'support': None}, 'macro_avg': {'precision': 0.7492422089608791, 'recall': 0.7697293758184198, 'f1': 0.757758518233764, 'support': None}, 'weighted_avg': {'precision': 0.8531809135226901, 'recall': 0.8477859778597786, 'f1': 0.8495324763546798, 'support': None}}
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.8958333333333334, 'contradicts': 0.5894039735099338, 'parts_of_same': 0.8888888888888888}, 'recall': {'supports': 0.9253164556962026, 'contradicts': 0.7416666666666667, 'parts_of_same': 0.5977011494252874}, 'f1': {'supports': 0.9103362391033624, 'contradicts': 0.6568265682656826, 'parts_of_same': 0.7147766323024054}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8523985239852399, 'recall': 0.8523985239852399, 'f1': 0.8523985239852399, 'support': None}, 'macro_avg': {'precision': 0.7913753985773854, 'recall': 0.7548947572627189, 'f1': 0.7606464798904836, 'support': None}, 'weighted_avg': {'precision': 0.860796565333203, 'recall': 0.8523985239852399, 'f1': 0.8508818737123218, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9060568603213844, 'contradicts': 0.6693548387096774, 'parts_of_same': 0.8079470198675497}, 'recall': {'supports': 0.9278481012658227, 'contradicts': 0.6916666666666667, 'parts_of_same': 0.7011494252873564}, 'f1': {'supports': 0.9168230143839899, 'contradicts': 0.6803278688524591, 'parts_of_same': 0.7507692307692307}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8653136531365314, 'recall': 0.8653136531365314, 'f1': 0.8653136531365314, 'support': None}, 'macro_avg': {'precision': 0.7944529062995372, 'recall': 0.7735547310732819, 'f1': 0.7826400380018933, 'support': None}, 'weighted_avg': {'precision': 0.8641054259741776, 'recall': 0.8653136531365314, 'f1': 0.863988350350086, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9172056921086675, 'contradicts': 0.6220472440944882, 'parts_of_same': 0.7445652173913043}, 'recall': {'supports': 0.8974683544303798, 'contradicts': 0.6583333333333333, 'parts_of_same': 0.7873563218390804}, 'f1': {'supports': 0.9072296865003199, 'contradicts': 0.6396761133603238, 'parts_of_same': 0.76536312849162}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8533210332103321, 'recall': 0.8533210332103321, 'f1': 0.8533210332103321, 'support': None}, 'macro_avg': {'precision': 0.76127271786482, 'recall': 0.7810526698675978, 'f1': 0.7707563094507547, 'support': None}, 'weighted_avg': {'precision': 0.8568196622539418, 'recall': 0.8533210332103321, 'f1': 0.8548392714908057, 'support': None}}
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9084967320261438, 'contradicts': 0.5652173913043478, 'parts_of_same': 0.7016574585635359}, 'recall': {'supports': 0.879746835443038, 'contradicts': 0.65, 'parts_of_same': 0.7298850574712644}, 'f1': {'supports': 0.8938906752411575, 'contradicts': 0.6046511627906976, 'parts_of_same': 0.7154929577464789}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8302583025830258, 'recall': 0.8302583025830258, 'f1': 0.8302583025830258, 'support': None}, 'macro_avg': {'precision': 0.7251238606313425, 'recall': 0.7532106309714343, 'f1': 0.7380115985927781, 'support': None}, 'weighted_avg': {'precision': 0.8372941910029803, 'recall': 0.8302583025830258, 'f1': 0.8332357450399313, 'support': None}}
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9245033112582781, 'contradicts': 0.6240601503759399, 'parts_of_same': 0.6938775510204082}, 'recall': {'supports': 0.8835443037974684, 'contradicts': 0.6916666666666667, 'parts_of_same': 0.7816091954022989}, 'f1': {'supports': 0.9035598705501617, 'contradicts': 0.6561264822134386, 'parts_of_same': 0.7351351351351352}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8459409594095941, 'recall': 0.8459409594095941, 'f1': 0.8459409594095942, 'support': None}, 'macro_avg': {'precision': 0.7474803375515421, 'recall': 0.785606721955478, 'f1': 0.7649404959662451, 'support': None}, 'weighted_avg': {'precision': 0.8542246566574755, 'recall': 0.8459409594095941, 'f1': 0.849133753794976, 'support': None}}
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9182305630026809, 'contradicts': 0.5432098765432098, 'parts_of_same': 0.6988636363636364}, 'recall': {'supports': 0.8670886075949367, 'contradicts': 0.7333333333333333, 'parts_of_same': 0.7068965517241379}, 'f1': {'supports': 0.8919270833333333, 'contradicts': 0.624113475177305, 'parts_of_same': 0.7028571428571428}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8265682656826568, 'recall': 0.8265682656826568, 'f1': 0.8265682656826568, 'support': None}, 'macro_avg': {'precision': 0.720101358636509, 'recall': 0.7691061642174692, 'f1': 0.7396325671225936, 'support': None}, 'weighted_avg': {'precision': 0.8415033235097563, 'recall': 0.8265682656826568, 'f1': 0.8319309554536464, 'support': None}}
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9129353233830846, 'contradicts': 0.7064220183486238, 'parts_of_same': 0.7719298245614035}, 'recall': {'supports': 0.9291139240506329, 'contradicts': 0.6416666666666667, 'parts_of_same': 0.7586206896551724}, 'f1': {'supports': 0.9209535759096613, 'contradicts': 0.6724890829694324, 'parts_of_same': 0.7652173913043477}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8699261992619927, 'recall': 0.8699261992619927, 'f1': 0.8699261992619927, 'support': None}, 'macro_avg': {'precision': 0.797095722097704, 'recall': 0.7764670934574905, 'f1': 0.7862200167278138, 'support': None}, 'weighted_avg': {'precision': 0.867440347922653, 'recall': 0.8699261992619927, 'f1': 0.8684500378338754, 'support': None}}
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.8911242603550296, 'contradicts': 0.7142857142857143, 'parts_of_same': 0.8432835820895522}, 'recall': {'supports': 0.9531645569620253, 'contradicts': 0.625, 'parts_of_same': 0.6494252873563219}, 'f1': {'supports': 0.9211009174311926, 'contradicts': 0.6666666666666666, 'parts_of_same': 0.7337662337662338}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8680811808118081, 'recall': 0.8680811808118081, 'f1': 0.868081180811808, 'support': None}, 'macro_avg': {'precision': 0.8162311855767653, 'recall': 0.7425299481061157, 'f1': 0.7738446059546978, 'support': None}, 'weighted_avg': {'precision': 0.8638688142789125, 'recall': 0.8680811808118081, 'f1': 0.862864436758272, 'support': None}}
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9066339066339066, 'contradicts': 0.7009345794392523, 'parts_of_same': 0.7668711656441718}, 'recall': {'supports': 0.9341772151898734, 'contradicts': 0.625, 'parts_of_same': 0.7183908045977011}, 'f1': {'supports': 0.9201995012468829, 'contradicts': 0.6607929515418502, 'parts_of_same': 0.7418397626112758}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8653136531365314, 'recall': 0.8653136531365314, 'f1': 0.8653136531365314, 'support': None}, 'macro_avg': {'precision': 0.7914798839057768, 'recall': 0.7591893399291916, 'f1': 0.7742774051333363, 'support': None}, 'weighted_avg': {'precision': 0.8614285226896518, 'recall': 0.8653136531365314, 'f1': 0.8628532092845217, 'support': None}}
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9036585365853659, 'contradicts': 0.7037037037037037, 'parts_of_same': 0.7884615384615384}, 'recall': {'supports': 0.9379746835443038, 'contradicts': 0.6333333333333333, 'parts_of_same': 0.7068965517241379}, 'f1': {'supports': 0.9204968944099379, 'contradicts': 0.6666666666666667, 'parts_of_same': 0.7454545454545455}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8671586715867159, 'recall': 0.8671586715867159, 'f1': 0.8671586715867159, 'support': None}, 'macro_avg': {'precision': 0.7986079262502027, 'recall': 0.7594015228672584, 'f1': 0.7775393688437168, 'support': None}, 'weighted_avg': {'precision': 0.8630322841689955, 'recall': 0.8671586715867159, 'f1': 0.8643004035912748, 'support': None}}
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.9038929440389294, 'contradicts': 0.7037037037037037, 'parts_of_same': 0.7987012987012987}, 'recall': {'supports': 0.9405063291139241, 'contradicts': 0.6333333333333333, 'parts_of_same': 0.7068965517241379}, 'f1': {'supports': 0.9218362282878413, 'contradicts': 0.6666666666666667, 'parts_of_same': 0.75}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8690036900369004, 'recall': 0.8690036900369004, 'f1': 0.8690036900369004, 'support': None}, 'macro_avg': {'precision': 0.8020993154813105, 'recall': 0.7602454047237984, 'f1': 0.779500964984836, 'support': None}, 'weighted_avg': {'precision': 0.8648467677206869, 'recall': 0.8690036900369004, 'f1': 0.8660061073315448, 'support': None}}
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.908641975308642, 'contradicts': 0.6851851851851852, 'parts_of_same': 0.7650602409638554}, 'recall': {'supports': 0.9316455696202531, 'contradicts': 0.6166666666666667, 'parts_of_same': 0.7298850574712644}, 'f1': {'supports': 0.92, 'contradicts': 0.6491228070175439, 'parts_of_same': 0.7470588235294118}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8643911439114391, 'recall': 0.8643911439114391, 'f1': 0.8643911439114391, 'support': None}, 'macro_avg': {'precision': 0.7862958004858941, 'recall': 0.7593990979193949, 'f1': 0.7720605435156519, 'support': None}, 'weighted_avg': {'precision': 0.860857808711956, 'recall': 0.8643911439114391, 'f1': 0.8622536643323091, 'support': None}}
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8838e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.902676399026764, 'contradicts': 0.6814159292035398, 'parts_of_same': 0.8120805369127517}, 'recall': {'supports': 0.9392405063291139, 'contradicts': 0.6416666666666667, 'parts_of_same': 0.6954022988505747}, 'f1': {'supports': 0.9205955334987593, 'contradicts': 0.6609442060085837, 'parts_of_same': 0.7492260061919505}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8671586715867159, 'recall': 0.8671586715867159, 'f1': 0.8671586715867159, 'support': None}, 'macro_avg': {'precision': 0.7987242883810186, 'recall': 0.7587698239487851, 'f1': 0.776921915233098, 'support': None}, 'weighted_avg': {'precision': 0.8636404798509105, 'recall': 0.8671586715867159, 'f1': 0.864344189356503, 'support': None}}
Loss: tensor(5.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.9008464328899637, 'contradicts': 0.6936936936936937, 'parts_of_same': 0.815068493150685}, 'recall': {'supports': 0.9430379746835443, 'contradicts': 0.6416666666666667, 'parts_of_same': 0.6839080459770115}, 'f1': {'supports': 0.9214594928880644, 'contradicts': 0.6666666666666667, 'parts_of_same': 0.7437499999999999}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8680811808118081, 'recall': 0.8680811808118081, 'f1': 0.868081180811808, 'support': None}, 'macro_avg': {'precision': 0.8032028732447808, 'recall': 0.7562042291090743, 'f1': 0.7772920531849103, 'support': None}, 'weighted_avg': {'precision': 0.8641456116554739, 'recall': 0.8680811808118081, 'f1': 0.8647283204627038, 'support': None}}
Loss: tensor(1.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.8997584541062802, 'contradicts': 0.6936936936936937, 'parts_of_same': 0.8137931034482758}, 'recall': {'supports': 0.9430379746835443, 'contradicts': 0.6416666666666667, 'parts_of_same': 0.6781609195402298}, 'f1': {'supports': 0.9208899876390606, 'contradicts': 0.6666666666666667, 'parts_of_same': 0.7398119122257054}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8671586715867159, 'recall': 0.8671586715867159, 'f1': 0.8671586715867159, 'support': None}, 'macro_avg': {'precision': 0.8024150837494166, 'recall': 0.7542885202968136, 'f1': 0.7757895221771443, 'support': None}, 'weighted_avg': {'precision': 0.8631479907631038, 'recall': 0.8671586715867159, 'f1': 0.863681146644032, 'support': None}}
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.9007263922518159, 'contradicts': 0.6936936936936937, 'parts_of_same': 0.8095238095238095}, 'recall': {'supports': 0.9417721518987342, 'contradicts': 0.6416666666666667, 'parts_of_same': 0.6839080459770115}, 'f1': {'supports': 0.9207920792079207, 'contradicts': 0.6666666666666667, 'parts_of_same': 0.7414330218068536}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8671586715867159, 'recall': 0.8671586715867159, 'f1': 0.8671586715867159, 'support': None}, 'macro_avg': {'precision': 0.8013146318231064, 'recall': 0.7557822881808042, 'f1': 0.7762972558938137, 'support': None}, 'weighted_avg': {'precision': 0.8631681143720671, 'recall': 0.8671586715867159, 'f1': 0.8638700077201568, 'support': None}}
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.9018181818181819, 'contradicts': 0.6936936936936937, 'parts_of_same': 0.8108108108108109}, 'recall': {'supports': 0.9417721518987342, 'contradicts': 0.6416666666666667, 'parts_of_same': 0.6896551724137931}, 'f1': {'supports': 0.9213622291021671, 'contradicts': 0.6666666666666667, 'parts_of_same': 0.7453416149068324}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8680811808118081, 'recall': 0.8680811808118081, 'f1': 0.868081180811808, 'support': None}, 'macro_avg': {'precision': 0.8021075621075622, 'recall': 0.7576979969930647, 'f1': 0.777790170225222, 'support': None}, 'weighted_avg': {'precision': 0.8641703763474983, 'recall': 0.8680811808118081, 'f1': 0.8649129169598716, 'support': None}}
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.9018181818181819, 'contradicts': 0.6936936936936937, 'parts_of_same': 0.8108108108108109}, 'recall': {'supports': 0.9417721518987342, 'contradicts': 0.6416666666666667, 'parts_of_same': 0.6896551724137931}, 'f1': {'supports': 0.9213622291021671, 'contradicts': 0.6666666666666667, 'parts_of_same': 0.7453416149068324}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8680811808118081, 'recall': 0.8680811808118081, 'f1': 0.868081180811808, 'support': None}, 'macro_avg': {'precision': 0.8021075621075622, 'recall': 0.7576979969930647, 'f1': 0.777790170225222, 'support': None}, 'weighted_avg': {'precision': 0.8641703763474983, 'recall': 0.8680811808118081, 'f1': 0.8649129169598716, 'support': None}}
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.9018181818181819, 'contradicts': 0.6936936936936937, 'parts_of_same': 0.8108108108108109}, 'recall': {'supports': 0.9417721518987342, 'contradicts': 0.6416666666666667, 'parts_of_same': 0.6896551724137931}, 'f1': {'supports': 0.9213622291021671, 'contradicts': 0.6666666666666667, 'parts_of_same': 0.7453416149068324}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8680811808118081, 'recall': 0.8680811808118081, 'f1': 0.868081180811808, 'support': None}, 'macro_avg': {'precision': 0.8021075621075622, 'recall': 0.7576979969930647, 'f1': 0.777790170225222, 'support': None}, 'weighted_avg': {'precision': 0.8641703763474983, 'recall': 0.8680811808118081, 'f1': 0.8649129169598716, 'support': None}}
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6396e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.9018181818181819, 'contradicts': 0.6936936936936937, 'parts_of_same': 0.8108108108108109}, 'recall': {'supports': 0.9417721518987342, 'contradicts': 0.6416666666666667, 'parts_of_same': 0.6896551724137931}, 'f1': {'supports': 0.9213622291021671, 'contradicts': 0.6666666666666667, 'parts_of_same': 0.7453416149068324}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8680811808118081, 'recall': 0.8680811808118081, 'f1': 0.868081180811808, 'support': None}, 'macro_avg': {'precision': 0.8021075621075622, 'recall': 0.7576979969930647, 'f1': 0.777790170225222, 'support': None}, 'weighted_avg': {'precision': 0.8641703763474983, 'recall': 0.8680811808118081, 'f1': 0.8649129169598716, 'support': None}}
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8633e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2679e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1730e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7684e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9018181818181819, 'contradicts': 0.6875, 'parts_of_same': 0.8163265306122449}, 'recall': {'supports': 0.9417721518987342, 'contradicts': 0.6416666666666667, 'parts_of_same': 0.6896551724137931}, 'f1': {'supports': 0.9213622291021671, 'contradicts': 0.6637931034482759, 'parts_of_same': 0.7476635514018692}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8680811808118081, 'recall': 0.8680811808118081, 'f1': 0.868081180811808, 'support': None}, 'macro_avg': {'precision': 0.8018815708101422, 'recall': 0.7576979969930647, 'f1': 0.7776062946507708, 'support': None}, 'weighted_avg': {'precision': 0.8643700922166921, 'recall': 0.8680811808118081, 'f1': 0.864967519694124, 'support': None}}
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7161e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6822e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8883e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6840e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8650e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7161e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8650e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3219e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6822e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.9018181818181819, 'contradicts': 0.6875, 'parts_of_same': 0.8163265306122449}, 'recall': {'supports': 0.9417721518987342, 'contradicts': 0.6416666666666667, 'parts_of_same': 0.6896551724137931}, 'f1': {'supports': 0.9213622291021671, 'contradicts': 0.6637931034482759, 'parts_of_same': 0.7476635514018692}, 'support': {'supports': 790, 'contradicts': 120, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8680811808118081, 'recall': 0.8680811808118081, 'f1': 0.868081180811808, 'support': None}, 'macro_avg': {'precision': 0.8018815708101422, 'recall': 0.7576979969930647, 'f1': 0.7776062946507708, 'support': None}, 'weighted_avg': {'precision': 0.8643700922166921, 'recall': 0.8680811808118081, 'f1': 0.864967519694124, 'support': None}}
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7789e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0781e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7789e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4350e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9599e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7789e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7789e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9599e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3219e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3219e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9599e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9599e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5299e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3489e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1679e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4350e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9869e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6840e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3489e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5299e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6840e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1730e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4350e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1679e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3401e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5299e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6161e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9869e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8920e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9781e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9869e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5029e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3219e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 2-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.0, 'contradicts': 0.07431192660550459, 'parts_of_same': 0.3148148148148148}, 'recall': {'supports': 0.0, 'contradicts': 0.8901098901098901, 'parts_of_same': 0.12454212454212454}, 'f1': {'supports': 0.0, 'contradicts': 0.13717188823031332, 'parts_of_same': 0.1784776902887139}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.09599332220367279, 'recall': 0.09599332220367279, 'f1': 0.09599332220367279, 'support': None}, 'macro_avg': {'precision': 0.12970891380677316, 'recall': 0.3382173382173382, 'f1': 0.10521652617300907, 'support': None}, 'weighted_avg': {'precision': 0.0773846659144786, 'recall': 0.09599332220367279, 'f1': 0.05109102777777747, 'support': None}}
Loss: tensor(0.4896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9277929155313351, 'contradicts': 0.5, 'parts_of_same': 0.6802325581395349}, 'recall': {'supports': 0.8165467625899281, 'contradicts': 0.6593406593406593, 'parts_of_same': 0.8571428571428571}, 'f1': {'supports': 0.8686224489795918, 'contradicts': 0.5687203791469195, 'parts_of_same': 0.7585089141004863}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8138564273789649, 'recall': 0.8138564273789649, 'f1': 0.8138564273789649, 'support': None}, 'macro_avg': {'precision': 0.70267515789029, 'recall': 0.7776767596911482, 'f1': 0.7319505807423327, 'support': None}, 'weighted_avg': {'precision': 0.8388837895870004, 'recall': 0.8138564273789649, 'f1': 0.8207492575131736, 'support': None}}
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4230, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.950920245398773, 'contradicts': 0.432258064516129, 'parts_of_same': 0.6214833759590793}, 'recall': {'supports': 0.7434052757793765, 'contradicts': 0.7362637362637363, 'parts_of_same': 0.8901098901098901}, 'f1': {'supports': 0.8344549125168237, 'contradicts': 0.5447154471544716, 'parts_of_same': 0.7319277108433734}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.7762938230383973, 'recall': 0.7762938230383973, 'f1': 0.7762938230383973, 'support': None}, 'macro_avg': {'precision': 0.6682205619579937, 'recall': 0.7899263007176677, 'f1': 0.7036993568382228, 'support': None}, 'weighted_avg': {'precision': 0.8364506929635835, 'recall': 0.7762938230383973, 'f1': 0.7890824438984381, 'support': None}}
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.909933774834437, 'contradicts': 0.42857142857142855, 'parts_of_same': 0.7331081081081081}, 'recall': {'supports': 0.8237410071942446, 'contradicts': 0.6923076923076923, 'parts_of_same': 0.7948717948717948}, 'f1': {'supports': 0.8646947765890497, 'contradicts': 0.5294117647058824, 'parts_of_same': 0.7627416520210896}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8071786310517529, 'recall': 0.8071786310517529, 'f1': 0.807178631051753, 'support': None}, 'macro_avg': {'precision': 0.6905377705046579, 'recall': 0.7703068314579106, 'f1': 0.7189493977720072, 'support': None}, 'weighted_avg': {'precision': 0.8330745256472738, 'recall': 0.8071786310517529, 'f1': 0.81599364379404, 'support': None}}
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.9267241379310345, 'contradicts': 0.5571428571428572, 'parts_of_same': 0.5833333333333334}, 'recall': {'supports': 0.7733812949640287, 'contradicts': 0.42857142857142855, 'parts_of_same': 0.9230769230769231}, 'f1': {'supports': 0.8431372549019608, 'contradicts': 0.48447204968944096, 'parts_of_same': 0.7148936170212767}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.7813021702838063, 'recall': 0.7813021702838063, 'f1': 0.7813021702838063, 'support': None}, 'macro_avg': {'precision': 0.6890667761357417, 'recall': 0.70834321553746, 'f1': 0.6808343072042261, 'support': None}, 'weighted_avg': {'precision': 0.8203989407633413, 'recall': 0.7813021702838063, 'f1': 0.7866689353562462, 'support': None}}
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.9225634178905207, 'contradicts': 0.5333333333333333, 'parts_of_same': 0.6545961002785515}, 'recall': {'supports': 0.8285371702637889, 'contradicts': 0.5274725274725275, 'parts_of_same': 0.8608058608058609}, 'f1': {'supports': 0.8730259001895135, 'contradicts': 0.5303867403314917, 'parts_of_same': 0.7436708860759494}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8130217028380634, 'recall': 0.8130217028380634, 'f1': 0.8130217028380634, 'support': None}, 'macro_avg': {'precision': 0.7034976171674684, 'recall': 0.7389385195140591, 'f1': 0.7156945088656516, 'support': None}, 'weighted_avg': {'precision': 0.8319331880050685, 'recall': 0.8130217028380634, 'f1': 0.8175216577854376, 'support': None}}
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.8677309007981756, 'contradicts': 0.5679012345679012, 'parts_of_same': 0.7958333333333333}, 'recall': {'supports': 0.9124700239808153, 'contradicts': 0.5054945054945055, 'parts_of_same': 0.6996336996336996}, 'f1': {'supports': 0.8895382817066043, 'contradicts': 0.5348837209302326, 'parts_of_same': 0.7446393762183235}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8330550918196995, 'recall': 0.8330550918196995, 'f1': 0.8330550918196995, 'support': None}, 'macro_avg': {'precision': 0.7438218228998034, 'recall': 0.7058660763696736, 'f1': 0.7230204596183868, 'support': None}, 'weighted_avg': {'precision': 0.8285718561029695, 'recall': 0.8330550918196995, 'f1': 0.8295792113986322, 'support': None}}
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.8569844789356984, 'contradicts': 0.625, 'parts_of_same': 0.8148148148148148}, 'recall': {'supports': 0.9268585131894485, 'contradicts': 0.5494505494505495, 'parts_of_same': 0.6446886446886447}, 'f1': {'supports': 0.8905529953917051, 'contradicts': 0.5847953216374269, 'parts_of_same': 0.7198364008179959}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.833889816360601, 'recall': 0.833889816360601, 'f1': 0.833889816360601, 'support': None}, 'macro_avg': {'precision': 0.7655997645835044, 'recall': 0.7069992357762143, 'f1': 0.731728239282376, 'support': None}, 'weighted_avg': {'precision': 0.8297533387953396, 'recall': 0.833889816360601, 'f1': 0.8284247995400674, 'support': None}}
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.89453125, 'contradicts': 0.4909090909090909, 'parts_of_same': 0.659375}, 'recall': {'supports': 0.8237410071942446, 'contradicts': 0.5934065934065934, 'parts_of_same': 0.7728937728937729}, 'f1': {'supports': 0.8576779026217228, 'contradicts': 0.5373134328358209, 'parts_of_same': 0.7116357504215851}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.7946577629382304, 'recall': 0.7946577629382304, 'f1': 0.7946577629382304, 'support': None}, 'macro_avg': {'precision': 0.6816051136363637, 'recall': 0.7300137911648702, 'f1': 0.7022090286263762, 'support': None}, 'weighted_avg': {'precision': 0.8102847786082865, 'recall': 0.7946577629382304, 'f1': 0.8000629825038976, 'support': None}}
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9175257731958762, 'contradicts': 0.37583892617449666, 'parts_of_same': 0.6297297297297297}, 'recall': {'supports': 0.7470023980815348, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.8534798534798534}, 'f1': {'supports': 0.8235294117647057, 'contradicts': 0.46666666666666673, 'parts_of_same': 0.7247278382581648}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.7612687813021702, 'recall': 0.7612687813021702, 'f1': 0.7612687813021701, 'support': None}, 'macro_avg': {'precision': 0.6410314763667009, 'recall': 0.7386222889820012, 'f1': 0.671641305563179, 'support': None}, 'weighted_avg': {'precision': 0.810796371739112, 'recall': 0.7612687813021702, 'f1': 0.7739072587002589, 'support': None}}
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.8994910941475827, 'contradicts': 0.42718446601941745, 'parts_of_same': 0.7346278317152104}, 'recall': {'supports': 0.8477218225419664, 'contradicts': 0.4835164835164835, 'parts_of_same': 0.8315018315018315}, 'f1': {'supports': 0.8728395061728395, 'contradicts': 0.4536082474226804, 'parts_of_same': 0.7800687285223369}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8163606010016694, 'recall': 0.8163606010016694, 'f1': 0.8163606010016694, 'support': None}, 'macro_avg': {'precision': 0.6871011306274036, 'recall': 0.7209133791867605, 'f1': 0.7021721607059522, 'support': None}, 'weighted_avg': {'precision': 0.8260457069992516, 'recall': 0.8163606010016694, 'f1': 0.8198541415277213, 'support': None}}
Loss: tensor(8.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.8845208845208845, 'contradicts': 0.5542168674698795, 'parts_of_same': 0.7009966777408638}, 'recall': {'supports': 0.8633093525179856, 'contradicts': 0.5054945054945055, 'parts_of_same': 0.7728937728937729}, 'f1': {'supports': 0.8737864077669902, 'contradicts': 0.5287356321839081, 'parts_of_same': 0.7351916376306621}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8155258764607679, 'recall': 0.8155258764607679, 'f1': 0.8155258764607678, 'support': None}, 'macro_avg': {'precision': 0.7132448099105426, 'recall': 0.7138992103020879, 'f1': 0.7125712258605201, 'support': None}, 'weighted_avg': {'precision': 0.8176095539678068, 'recall': 0.8155258764607679, 'f1': 0.8159934254420503, 'support': None}}
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.8905882352941177, 'contradicts': 0.6129032258064516, 'parts_of_same': 0.7797202797202797}, 'recall': {'supports': 0.907673860911271, 'contradicts': 0.4175824175824176, 'parts_of_same': 0.8168498168498168}, 'f1': {'supports': 0.8990498812351544, 'contradicts': 0.4967320261437909, 'parts_of_same': 0.7978533094812164}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8497495826377296, 'recall': 0.8497495826377296, 'f1': 0.8497495826377296, 'support': None}, 'macro_avg': {'precision': 0.7610705802736163, 'recall': 0.7140353651145018, 'f1': 0.7312117389533871, 'support': None}, 'weighted_avg': {'precision': 0.8442307330111165, 'recall': 0.8497495826377296, 'f1': 0.8454291893301968, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.898428053204353, 'contradicts': 0.625, 'parts_of_same': 0.749185667752443}, 'recall': {'supports': 0.8908872901678657, 'contradicts': 0.43956043956043955, 'parts_of_same': 0.8424908424908425}, 'f1': {'supports': 0.8946417820590005, 'contradicts': 0.5161290322580646, 'parts_of_same': 0.7931034482758621}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.845575959933222, 'recall': 0.845575959933222, 'f1': 0.845575959933222, 'support': None}, 'macro_avg': {'precision': 0.7575379069855986, 'recall': 0.7243128574063826, 'f1': 0.7346247541976424, 'support': None}, 'weighted_avg': {'precision': 0.8436491516434452, 'recall': 0.845575959933222, 'f1': 0.8427514436994997, 'support': None}}
Loss: tensor(6.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(12.6339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(11.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9175126903553299, 'contradicts': 0.47540983606557374, 'parts_of_same': 0.7777777777777778}, 'recall': {'supports': 0.8669064748201439, 'contradicts': 0.6373626373626373, 'parts_of_same': 0.8205128205128205}, 'f1': {'supports': 0.8914919852034524, 'contradicts': 0.5446009389671361, 'parts_of_same': 0.7985739750445632}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.83889816360601, 'recall': 0.83889816360601, 'f1': 0.83889816360601, 'support': None}, 'macro_avg': {'precision': 0.7235667680662271, 'recall': 0.7749273108985338, 'f1': 0.7448889664050505, 'support': None}, 'weighted_avg': {'precision': 0.8520878231816742, 'recall': 0.83889816360601, 'f1': 0.843968026955638, 'support': None}}
Loss: tensor(1.8299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.8937644341801386, 'contradicts': 0.6470588235294118, 'parts_of_same': 0.8143939393939394}, 'recall': {'supports': 0.9280575539568345, 'contradicts': 0.4835164835164835, 'parts_of_same': 0.7875457875457875}, 'f1': {'supports': 0.9105882352941177, 'contradicts': 0.5534591194968553, 'parts_of_same': 0.8007448789571695}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8622704507512521, 'recall': 0.8622704507512521, 'f1': 0.8622704507512521, 'support': None}, 'macro_avg': {'precision': 0.7850723990344965, 'recall': 0.7330399416730352, 'f1': 0.7549307445827141, 'support': None}, 'weighted_avg': {'precision': 0.8569377600183286, 'recall': 0.8622704507512521, 'f1': 0.8584296494697957, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9105590062111801, 'contradicts': 0.5903614457831325, 'parts_of_same': 0.7483870967741936}, 'recall': {'supports': 0.8788968824940048, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.8498168498168498}, 'f1': {'supports': 0.8944478340451496, 'contradicts': 0.5632183908045977, 'parts_of_same': 0.7958833619210978}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8464106844741235, 'recall': 0.8464106844741235, 'f1': 0.8464106844741235, 'support': None}, 'macro_avg': {'precision': 0.7497691829228353, 'recall': 0.7557250902574643, 'f1': 0.7511831955902818, 'support': None}, 'weighted_avg': {'precision': 0.8492811186692356, 'recall': 0.8464106844741235, 'f1': 0.8468268154936, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9079118028534371, 'contradicts': 0.5060240963855421, 'parts_of_same': 0.6773255813953488}, 'recall': {'supports': 0.8393285371702638, 'contradicts': 0.46153846153846156, 'parts_of_same': 0.8534798534798534}, 'f1': {'supports': 0.8722741433021807, 'contradicts': 0.4827586206896552, 'parts_of_same': 0.7552674230145866}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8138564273789649, 'recall': 0.8138564273789649, 'f1': 0.8138564273789649, 'support': None}, 'macro_avg': {'precision': 0.6970871602114427, 'recall': 0.7181156173961929, 'f1': 0.7034333956688075, 'support': None}, 'weighted_avg': {'precision': 0.8248384975557438, 'recall': 0.8138564273789649, 'f1': 0.8160231022368609, 'support': None}}
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4516, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.8844807467911319, 'contradicts': 0.6176470588235294, 'parts_of_same': 0.7655677655677655}, 'recall': {'supports': 0.9088729016786571, 'contradicts': 0.46153846153846156, 'parts_of_same': 0.7655677655677655}, 'f1': {'supports': 0.8965109402720284, 'contradicts': 0.5283018867924528, 'parts_of_same': 0.7655677655677655}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.842237061769616, 'recall': 0.842237061769616, 'f1': 0.842237061769616, 'support': None}, 'macro_avg': {'precision': 0.7558985237274757, 'recall': 0.7119930429282947, 'f1': 0.7301268642107489, 'support': None}, 'weighted_avg': {'precision': 0.8371142113328425, 'recall': 0.842237061769616, 'f1': 0.8387025007387187, 'support': None}}
Loss: tensor(7.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.917910447761194, 'contradicts': 0.5647058823529412, 'parts_of_same': 0.7540453074433657}, 'recall': {'supports': 0.8848920863309353, 'contradicts': 0.5274725274725275, 'parts_of_same': 0.8534798534798534}, 'f1': {'supports': 0.9010989010989011, 'contradicts': 0.5454545454545454, 'parts_of_same': 0.8006872852233677}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8505843071786311, 'recall': 0.8505843071786311, 'f1': 0.8505843071786311, 'support': None}, 'macro_avg': {'precision': 0.7455538791858336, 'recall': 0.7552814890944388, 'f1': 0.7490802439256047, 'support': None}, 'weighted_avg': {'precision': 0.8537394972111789, 'recall': 0.8505843071786311, 'f1': 0.8512024006834945, 'support': None}}
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.8933333333333333, 'contradicts': 0.4666666666666667, 'parts_of_same': 0.8235294117647058}, 'recall': {'supports': 0.8836930455635491, 'contradicts': 0.6923076923076923, 'parts_of_same': 0.717948717948718}, 'f1': {'supports': 0.8884870403857745, 'contradicts': 0.5575221238938054, 'parts_of_same': 0.767123287671233}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8313856427378965, 'recall': 0.8313856427378965, 'f1': 0.8313856427378965, 'support': None}, 'macro_avg': {'precision': 0.727843137254902, 'recall': 0.7646498186066532, 'f1': 0.7377108173169376, 'support': None}, 'weighted_avg': {'precision': 0.8450168581622965, 'recall': 0.8313856427378965, 'f1': 0.8356906197748907, 'support': None}}
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.8857837181044957, 'contradicts': 0.4897959183673469, 'parts_of_same': 0.7545126353790613}, 'recall': {'supports': 0.8741007194244604, 'contradicts': 0.5274725274725275, 'parts_of_same': 0.7655677655677655}, 'f1': {'supports': 0.8799034399517199, 'contradicts': 0.5079365079365079, 'parts_of_same': 0.76}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8230383973288815, 'recall': 0.8230383973288815, 'f1': 0.8230383973288815, 'support': None}, 'macro_avg': {'precision': 0.7100307572836346, 'recall': 0.7223803374882513, 'f1': 0.7159466492960759, 'support': None}, 'weighted_avg': {'precision': 0.8257904832462953, 'recall': 0.8230383973288815, 'f1': 0.8243252847595631, 'support': None}}
Loss: tensor(3.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.9205479452054794, 'contradicts': 0.39766081871345027, 'parts_of_same': 0.7407407407407407}, 'recall': {'supports': 0.8057553956834532, 'contradicts': 0.7472527472527473, 'parts_of_same': 0.8058608058608059}, 'f1': {'supports': 0.8593350383631713, 'contradicts': 0.5190839694656488, 'parts_of_same': 0.7719298245614035}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8013355592654424, 'recall': 0.8013355592654424, 'f1': 0.8013355592654424, 'support': None}, 'macro_avg': {'precision': 0.6863165015532235, 'recall': 0.7862896495990022, 'f1': 0.7167829441300745, 'support': None}, 'weighted_avg': {'precision': 0.8398550442625342, 'recall': 0.8013355592654424, 'f1': 0.8135717072800684, 'support': None}}
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.8964677222898904, 'contradicts': 0.5098039215686274, 'parts_of_same': 0.7854545454545454}, 'recall': {'supports': 0.882494004796163, 'contradicts': 0.5714285714285714, 'parts_of_same': 0.7912087912087912}, 'f1': {'supports': 0.8894259818731117, 'contradicts': 0.5388601036269429, 'parts_of_same': 0.7883211678832116}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8380634390651085, 'recall': 0.8380634390651085, 'f1': 0.8380634390651085, 'support': None}, 'macro_avg': {'precision': 0.7305753964376877, 'recall': 0.7483771224778418, 'f1': 0.7388690844610887, 'support': None}, 'weighted_avg': {'precision': 0.8417991053101873, 'recall': 0.8380634390651085, 'f1': 0.8397572764143102, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.8968446601941747, 'contradicts': 0.5257731958762887, 'parts_of_same': 0.7870036101083032}, 'recall': {'supports': 0.8860911270983214, 'contradicts': 0.5604395604395604, 'parts_of_same': 0.7985347985347986}, 'f1': {'supports': 0.8914354644149577, 'contradicts': 0.5425531914893617, 'parts_of_same': 0.7927272727272728}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8414023372287145, 'recall': 0.8414023372287145, 'f1': 0.8414023372287145, 'support': None}, 'macro_avg': {'precision': 0.7365404887262555, 'recall': 0.7483551620242267, 'f1': 0.7422386428771973, 'support': None}, 'weighted_avg': {'precision': 0.843627540055301, 'recall': 0.8414023372287145, 'f1': 0.8424407873139834, 'support': None}}
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.8946731234866828, 'contradicts': 0.5208333333333334, 'parts_of_same': 0.7862318840579711}, 'recall': {'supports': 0.8860911270983214, 'contradicts': 0.5494505494505495, 'parts_of_same': 0.7948717948717948}, 'f1': {'supports': 0.8903614457831325, 'contradicts': 0.5347593582887702, 'parts_of_same': 0.790528233151184}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8397328881469115, 'recall': 0.8397328881469115, 'f1': 0.8397328881469116, 'support': None}, 'macro_avg': {'precision': 0.7339127802926625, 'recall': 0.7434711571402218, 'f1': 0.7385496790743623, 'support': None}, 'weighted_avg': {'precision': 0.8415647100743346, 'recall': 0.8397328881469115, 'f1': 0.8405999624688513, 'support': None}}
Loss: tensor(3.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.892512077294686, 'contradicts': 0.5157894736842106, 'parts_of_same': 0.7854545454545454}, 'recall': {'supports': 0.8860911270983214, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.7912087912087912}, 'f1': {'supports': 0.8892900120336944, 'contradicts': 0.5268817204301075, 'parts_of_same': 0.7883211678832116}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8380634390651085, 'recall': 0.8380634390651085, 'f1': 0.8380634390651085, 'support': None}, 'macro_avg': {'precision': 0.7312520321444808, 'recall': 0.738587152256217, 'f1': 0.7348309667823378, 'support': None}, 'weighted_avg': {'precision': 0.839500004572723, 'recall': 0.8380634390651085, 'f1': 0.8387527424268428, 'support': None}}
Loss: tensor(2.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7708e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.8926417370325693, 'contradicts': 0.5157894736842106, 'parts_of_same': 0.7883211678832117}, 'recall': {'supports': 0.8872901678657075, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.7912087912087912}, 'f1': {'supports': 0.8899579073962718, 'contradicts': 0.5268817204301075, 'parts_of_same': 0.7897623400365631}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.83889816360601, 'recall': 0.83889816360601, 'f1': 0.83889816360601, 'support': None}, 'macro_avg': {'precision': 0.7322507928666638, 'recall': 0.7389868325120124, 'f1': 0.7355339892876475, 'support': None}, 'weighted_avg': {'precision': 0.8402435138752444, 'recall': 0.83889816360601, 'f1': 0.8395461186624477, 'support': None}}
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.8926417370325693, 'contradicts': 0.5157894736842106, 'parts_of_same': 0.7883211678832117}, 'recall': {'supports': 0.8872901678657075, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.7912087912087912}, 'f1': {'supports': 0.8899579073962718, 'contradicts': 0.5268817204301075, 'parts_of_same': 0.7897623400365631}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.83889816360601, 'recall': 0.83889816360601, 'f1': 0.83889816360601, 'support': None}, 'macro_avg': {'precision': 0.7322507928666638, 'recall': 0.7389868325120124, 'f1': 0.7355339892876475, 'support': None}, 'weighted_avg': {'precision': 0.8402435138752444, 'recall': 0.83889816360601, 'f1': 0.8395461186624477, 'support': None}}
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3577e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.8927710843373494, 'contradicts': 0.5212765957446809, 'parts_of_same': 0.7883211678832117}, 'recall': {'supports': 0.8884892086330936, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.7912087912087912}, 'f1': {'supports': 0.890625, 'contradicts': 0.5297297297297296, 'parts_of_same': 0.7897623400365631}, 'support': {'supports': 834, 'contradicts': 91, 'parts_of_same': 273}, 'micro_avg': {'precision': 0.8397328881469115, 'recall': 0.8397328881469115, 'f1': 0.8397328881469116, 'support': None}, 'macro_avg': {'precision': 0.7341229493217473, 'recall': 0.7393865127678078, 'f1': 0.7367056899220975, 'support': None}, 'weighted_avg': {'precision': 0.8407503617547848, 'recall': 0.8397328881469115, 'f1': 0.8402268566238623, 'support': None}}
Loss: tensor(6.7298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4108e-06, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 3-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 1.0, 'contradicts': 0.0, 'parts_of_same': 0.14688300597779674}, 'recall': {'supports': 0.0011402508551881414, 'contradicts': 0.0, 'parts_of_same': 0.9885057471264368}, 'f1': {'supports': 0.0022779043280182236, 'contradicts': 0.0, 'parts_of_same': 0.2557620817843866}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.14735945485519591, 'recall': 0.14735945485519591, 'f1': 0.14735945485519591, 'support': None}, 'macro_avg': {'precision': 0.38229433532593227, 'recall': 0.3298819993272083, 'f1': 0.08601332870413493, 'support': None}, 'weighted_avg': {'precision': 0.7687884523340176, 'recall': 0.14735945485519591, 'f1': 0.039608453429433775, 'support': None}}
Loss: tensor(1.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9253731343283582, 'contradicts': 0.425531914893617, 'parts_of_same': 0.837037037037037}, 'recall': {'supports': 0.8483466362599772, 'contradicts': 0.8130081300813008, 'parts_of_same': 0.6494252873563219}, 'f1': {'supports': 0.8851873884592504, 'contradicts': 0.558659217877095, 'parts_of_same': 0.7313915857605179}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8151618398637138, 'recall': 0.8151618398637138, 'f1': 0.8151618398637137, 'support': None}, 'macro_avg': {'precision': 0.729314028753004, 'recall': 0.7702600178992, 'f1': 0.725079397365621, 'support': None}, 'weighted_avg': {'precision': 0.8599123584176572, 'recall': 0.8151618398637138, 'f1': 0.8281827592844765, 'support': None}}
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9463087248322147, 'contradicts': 0.44660194174757284, 'parts_of_same': 0.6053811659192825}, 'recall': {'supports': 0.8038768529076397, 'contradicts': 0.7479674796747967, 'parts_of_same': 0.7758620689655172}, 'f1': {'supports': 0.8692971639950678, 'contradicts': 0.5592705167173253, 'parts_of_same': 0.6801007556675064}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.7938671209540034, 'recall': 0.7938671209540034, 'f1': 0.7938671209540034, 'support': None}, 'macro_avg': {'precision': 0.6660972774996899, 'recall': 0.7759021338493178, 'f1': 0.7028894787932999, 'support': None}, 'weighted_avg': {'precision': 0.843425139167597, 'recall': 0.7938671209540034, 'f1': 0.8087746319131615, 'support': None}}
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9361702127659575, 'contradicts': 0.5511811023622047, 'parts_of_same': 0.43859649122807015}, 'recall': {'supports': 0.7525655644241733, 'contradicts': 0.5691056910569106, 'parts_of_same': 0.8620689655172413}, 'f1': {'supports': 0.8343868520859672, 'contradicts': 0.5599999999999999, 'parts_of_same': 0.5813953488372092}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.7495741056218058, 'recall': 0.7495741056218058, 'f1': 0.7495741056218058, 'support': None}, 'macro_avg': {'precision': 0.6419826021187441, 'recall': 0.7279134069994417, 'f1': 0.658594066974392, 'support': None}, 'weighted_avg': {'precision': 0.8220888770527939, 'recall': 0.7495741056218058, 'f1': 0.768143151598865, 'support': None}}
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.9280397022332506, 'contradicts': 0.5584415584415584, 'parts_of_same': 0.616822429906542}, 'recall': {'supports': 0.8529076396807298, 'contradicts': 0.6991869918699187, 'parts_of_same': 0.7586206896551724}, 'f1': {'supports': 0.8888888888888888, 'contradicts': 0.6209386281588447, 'parts_of_same': 0.6804123711340205}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8228279386712095, 'recall': 0.8228279386712095, 'f1': 0.8228279386712095, 'support': None}, 'macro_avg': {'precision': 0.7011012301937837, 'recall': 0.7702384404019403, 'f1': 0.7300799627272513, 'support': None}, 'weighted_avg': {'precision': 0.8431909994468576, 'recall': 0.8228279386712095, 'f1': 0.8299171715472002, 'support': None}}
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.8893756845564075, 'contradicts': 0.6333333333333333, 'parts_of_same': 0.6842105263157895}, 'recall': {'supports': 0.9258836944127709, 'contradicts': 0.4634146341463415, 'parts_of_same': 0.6724137931034483}, 'f1': {'supports': 0.9072625698324023, 'contradicts': 0.5352112676056339, 'parts_of_same': 0.6782608695652174}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8398637137989778, 'recall': 0.8398637137989778, 'f1': 0.8398637137989778, 'support': None}, 'macro_avg': {'precision': 0.73563984806851, 'recall': 0.6872373738875202, 'f1': 0.7069115690010844, 'support': None}, 'weighted_avg': {'precision': 0.8321423398082766, 'recall': 0.8398637137989778, 'f1': 0.8343421217741547, 'support': None}}
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9225352112676056, 'contradicts': 0.5416666666666666, 'parts_of_same': 0.7857142857142857}, 'recall': {'supports': 0.8962371721778791, 'contradicts': 0.7398373983739838, 'parts_of_same': 0.6954022988505747}, 'f1': {'supports': 0.9091960670908039, 'contradicts': 0.6254295532646048, 'parts_of_same': 0.7378048780487806}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8500851788756388, 'recall': 0.8500851788756388, 'f1': 0.8500851788756388, 'support': None}, 'macro_avg': {'precision': 0.7499720545495193, 'recall': 0.7771589564674791, 'f1': 0.7574768328013964, 'support': None}, 'weighted_avg': {'precision': 0.8623532078330288, 'recall': 0.8500851788756388, 'f1': 0.854063743331064, 'support': None}}
Loss: tensor(7.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9141566265060241, 'contradicts': 0.6106194690265486, 'parts_of_same': 0.35768261964735515}, 'recall': {'supports': 0.6921322690992018, 'contradicts': 0.5609756097560976, 'parts_of_same': 0.8160919540229885}, 'f1': {'supports': 0.7878001297858532, 'contradicts': 0.5847457627118644, 'parts_of_same': 0.4973730297723292}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.696763202725724, 'recall': 0.696763202725724, 'f1': 0.696763202725724, 'support': None}, 'macro_avg': {'precision': 0.6274862383933093, 'recall': 0.6897332776260959, 'f1': 0.6233063074233489, 'support': None}, 'weighted_avg': {'precision': 0.7998793287518641, 'recall': 0.696763202725724, 'f1': 0.7234815586168126, 'support': None}}
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.9174311926605505, 'contradicts': 0.6416666666666667, 'parts_of_same': 0.7032967032967034}, 'recall': {'supports': 0.9111617312072893, 'contradicts': 0.6311475409836066, 'parts_of_same': 0.735632183908046}, 'f1': {'supports': 0.9142857142857143, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.7191011235955056}, 'support': {'supports': 878, 'contradicts': 122, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8560477001703578, 'recall': 0.8560477001703578, 'f1': 0.8560477001703578, 'support': None}, 'macro_avg': {'precision': 0.7541315208746403, 'recall': 0.7593138186996473, 'f1': 0.756583491414952, 'support': None}, 'weighted_avg': {'precision': 0.8570370927282138, 'recall': 0.8560477001703578, 'f1': 0.8564759934283124, 'support': None}}
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9159859976662778, 'contradicts': 0.5390070921985816, 'parts_of_same': 0.6761363636363636}, 'recall': {'supports': 0.8940774487471527, 'contradicts': 0.6229508196721312, 'parts_of_same': 0.6839080459770115}, 'f1': {'supports': 0.9048991354466859, 'contradicts': 0.5779467680608364, 'parts_of_same': 0.68}, 'support': {'supports': 878, 'contradicts': 122, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8347529812606473, 'recall': 0.8347529812606473, 'f1': 0.8347529812606473, 'support': None}, 'macro_avg': {'precision': 0.7103764845004076, 'recall': 0.7336454381320984, 'f1': 0.7209486345025075, 'support': None}, 'weighted_avg': {'precision': 0.8412626051720153, 'recall': 0.8347529812606473, 'f1': 0.8375902441444739, 'support': None}}
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9213075060532687, 'contradicts': 0.5316455696202531, 'parts_of_same': 0.6631578947368421}, 'recall': {'supports': 0.8667425968109339, 'contradicts': 0.6885245901639344, 'parts_of_same': 0.7241379310344828}, 'f1': {'supports': 0.8931924882629109, 'contradicts': 0.5999999999999999, 'parts_of_same': 0.6923076923076923}, 'support': {'supports': 878, 'contradicts': 122, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8270868824531517, 'recall': 0.8270868824531517, 'f1': 0.8270868824531517, 'support': None}, 'macro_avg': {'precision': 0.7053703234701213, 'recall': 0.7598017060031169, 'f1': 0.7285000601902011, 'support': None}, 'weighted_avg': {'precision': 0.84255385306018, 'recall': 0.8270868824531517, 'f1': 0.832951058906622, 'support': None}}
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.90625, 'contradicts': 0.5983606557377049, 'parts_of_same': 0.7692307692307693}, 'recall': {'supports': 0.9258836944127709, 'contradicts': 0.5934959349593496, 'parts_of_same': 0.6896551724137931}, 'f1': {'supports': 0.915961646926114, 'contradicts': 0.5959183673469388, 'parts_of_same': 0.7272727272727274}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8560477001703578, 'recall': 0.8560477001703578, 'f1': 0.8560477001703578, 'support': None}, 'macro_avg': {'precision': 0.7579471416561581, 'recall': 0.7363449339286379, 'f1': 0.7463842471819268, 'support': None}, 'weighted_avg': {'precision': 0.8536846375654953, 'recall': 0.8560477001703578, 'f1': 0.8544648876348638, 'support': None}}
Loss: tensor(5.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9073869900771775, 'contradicts': 0.6403508771929824, 'parts_of_same': 0.7777777777777778}, 'recall': {'supports': 0.9373576309794989, 'contradicts': 0.5934959349593496, 'parts_of_same': 0.6878612716763006}, 'f1': {'supports': 0.9221288515406163, 'contradicts': 0.6160337552742616, 'parts_of_same': 0.7300613496932514}, 'support': {'supports': 878, 'contradicts': 123, 'parts_of_same': 173}, 'micro_avg': {'precision': 0.8645655877342419, 'recall': 0.8645655877342419, 'f1': 0.8645655877342419, 'support': None}, 'macro_avg': {'precision': 0.7751718816826458, 'recall': 0.739571612538383, 'f1': 0.7560746521693765, 'support': None}, 'weighted_avg': {'precision': 0.8603104691124823, 'recall': 0.8645655877342419, 'f1': 0.861756300722596, 'support': None}}
Loss: tensor(6.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9090909090909091, 'contradicts': 0.6403508771929824, 'parts_of_same': 0.7658227848101266}, 'recall': {'supports': 0.935005701254276, 'contradicts': 0.5934959349593496, 'parts_of_same': 0.6954022988505747}, 'f1': {'supports': 0.921866216975829, 'contradicts': 0.6160337552742616, 'parts_of_same': 0.7289156626506024}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8637137989778535, 'recall': 0.8637137989778535, 'f1': 0.8637137989778535, 'support': None}, 'macro_avg': {'precision': 0.7717548570313394, 'recall': 0.7413013116880668, 'f1': 0.7556052116335644, 'support': None}, 'weighted_avg': {'precision': 0.8597010645012148, 'recall': 0.8637137989778535, 'f1': 0.8612267031411764, 'support': None}}
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9137737961926092, 'contradicts': 0.6239316239316239, 'parts_of_same': 0.7621951219512195}, 'recall': {'supports': 0.9304446978335233, 'contradicts': 0.5934959349593496, 'parts_of_same': 0.7183908045977011}, 'f1': {'supports': 0.9220338983050848, 'contradicts': 0.6083333333333334, 'parts_of_same': 0.7396449704142011}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8637137989778535, 'recall': 0.8637137989778535, 'f1': 0.8637137989778535, 'support': None}, 'macro_avg': {'precision': 0.7666335140251509, 'recall': 0.7474438124635246, 'f1': 0.7566707340175398, 'support': None}, 'weighted_avg': {'precision': 0.8609413630528281, 'recall': 0.8637137989778535, 'f1': 0.8621353949451707, 'support': None}}
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9136771300448431, 'contradicts': 0.6239316239316239, 'parts_of_same': 0.7575757575757576}, 'recall': {'supports': 0.928246013667426, 'contradicts': 0.5934959349593496, 'parts_of_same': 0.7225433526011561}, 'f1': {'supports': 0.9209039548022598, 'contradicts': 0.6083333333333334, 'parts_of_same': 0.7396449704142012}, 'support': {'supports': 878, 'contradicts': 123, 'parts_of_same': 173}, 'micro_avg': {'precision': 0.862862010221465, 'recall': 0.862862010221465, 'f1': 0.8628620102214649, 'support': None}, 'macro_avg': {'precision': 0.7650615038507415, 'recall': 0.7480951004093105, 'f1': 0.7562940861832649, 'support': None}, 'weighted_avg': {'precision': 0.8603174752841296, 'recall': 0.862862010221465, 'f1': 0.8614457003390468, 'support': None}}
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9136771300448431, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.7575757575757576}, 'recall': {'supports': 0.928246013667426, 'contradicts': 0.5901639344262295, 'parts_of_same': 0.7183908045977011}, 'f1': {'supports': 0.9209039548022598, 'contradicts': 0.602510460251046, 'parts_of_same': 0.7374631268436579}, 'support': {'supports': 878, 'contradicts': 122, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8620102214650767, 'recall': 0.8620102214650767, 'f1': 0.8620102214650767, 'support': None}, 'macro_avg': {'precision': 0.7622125010017387, 'recall': 0.7456002508971188, 'f1': 0.7536258472989878, 'support': None}, 'weighted_avg': {'precision': 0.859543121869231, 'recall': 0.8620102214650767, 'f1': 0.8606290737119321, 'support': None}}
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9134831460674158, 'contradicts': 0.6134453781512605, 'parts_of_same': 0.7575757575757576}, 'recall': {'supports': 0.927023945267959, 'contradicts': 0.5934959349593496, 'parts_of_same': 0.7183908045977011}, 'f1': {'supports': 0.9202037351443124, 'contradicts': 0.6033057851239669, 'parts_of_same': 0.7374631268436579}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8611584327086882, 'recall': 0.8611584327086882, 'f1': 0.8611584327086882, 'support': None}, 'macro_avg': {'precision': 0.7615014272648114, 'recall': 0.7463035616083366, 'f1': 0.7536575490373124, 'support': None}, 'weighted_avg': {'precision': 0.8589409560748811, 'recall': 0.8611584327086882, 'f1': 0.8599181187075011, 'support': None}}
Loss: tensor(9.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.9132882882882883, 'contradicts': 0.6134453781512605, 'parts_of_same': 0.7485029940119761}, 'recall': {'supports': 0.9247434435575826, 'contradicts': 0.5934959349593496, 'parts_of_same': 0.7183908045977011}, 'f1': {'supports': 0.9189801699716714, 'contradicts': 0.6033057851239669, 'parts_of_same': 0.7331378299120234}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8594548551959114, 'recall': 0.8594548551959114, 'f1': 0.8594548551959114, 'support': None}, 'macro_avg': {'precision': 0.7584122201505084, 'recall': 0.7455433943715445, 'f1': 0.7518079283358872, 'support': None}, 'weighted_avg': {'precision': 0.8574507080915824, 'recall': 0.8594548551959114, 'f1': 0.8583630349574921, 'support': None}}
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.9143179255918827, 'contradicts': 0.6134453781512605, 'parts_of_same': 0.75}, 'recall': {'supports': 0.9247434435575826, 'contradicts': 0.5934959349593496, 'parts_of_same': 0.7241379310344828}, 'f1': {'supports': 0.9195011337868481, 'contradicts': 0.6033057851239669, 'parts_of_same': 0.736842105263158}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8603066439522998, 'recall': 0.8603066439522998, 'f1': 0.8603066439522998, 'support': None}, 'macro_avg': {'precision': 0.7592544345810478, 'recall': 0.747459103183805, 'f1': 0.7532163413913243, 'support': None}, 'weighted_avg': {'precision': 0.8584417395712829, 'recall': 0.8603066439522998, 'f1': 0.8593012199464252, 'support': None}}
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.9133858267716536, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.7440476190476191}, 'recall': {'supports': 0.9248291571753986, 'contradicts': 0.5901639344262295, 'parts_of_same': 0.7183908045977011}, 'f1': {'supports': 0.9190718732314658, 'contradicts': 0.602510460251046, 'parts_of_same': 0.7309941520467835}, 'support': {'supports': 878, 'contradicts': 122, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8594548551959114, 'recall': 0.8594548551959114, 'f1': 0.8594548551959114, 'support': None}, 'macro_avg': {'precision': 0.7576060204012961, 'recall': 0.7444612987331097, 'f1': 0.7508588285097652, 'support': None}, 'weighted_avg': {'precision': 0.8573202425014657, 'recall': 0.8594548551959114, 'f1': 0.8583001391005067, 'support': None}}
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.9133858267716536, 'contradicts': 0.6186440677966102, 'parts_of_same': 0.7485029940119761}, 'recall': {'supports': 0.9258836944127709, 'contradicts': 0.5934959349593496, 'parts_of_same': 0.7183908045977011}, 'f1': {'supports': 0.9195922989807475, 'contradicts': 0.6058091286307055, 'parts_of_same': 0.7331378299120234}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8603066439522998, 'recall': 0.8603066439522998, 'f1': 0.8603066439522998, 'support': None}, 'macro_avg': {'precision': 0.7601776295267465, 'recall': 0.7459234779899405, 'f1': 0.752846419174492, 'support': None}, 'weighted_avg': {'precision': 0.8580682379691713, 'recall': 0.8603066439522998, 'f1': 0.8590825821400206, 'support': None}}
Loss: tensor(5.4646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9494e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.9112359550561798, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.7425149700598802}, 'recall': {'supports': 0.9247434435575826, 'contradicts': 0.5853658536585366, 'parts_of_same': 0.7126436781609196}, 'f1': {'supports': 0.9179400113186191, 'contradicts': 0.6, 'parts_of_same': 0.7272727272727273}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8577512776831345, 'recall': 0.8577512776831345, 'f1': 0.8577512776831345, 'support': None}, 'macro_avg': {'precision': 0.7563785135002252, 'recall': 0.7409176584590128, 'f1': 0.7484042461971155, 'support': None}, 'weighted_avg': {'precision': 0.8552332581490601, 'recall': 0.8577512776831345, 'f1': 0.856370395631928, 'support': None}}
Loss: tensor(4.5858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5012e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.9111361079865017, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.7380952380952381}, 'recall': {'supports': 0.9236031927023945, 'contradicts': 0.5853658536585366, 'parts_of_same': 0.7126436781609196}, 'f1': {'supports': 0.9173272933182333, 'contradicts': 0.6, 'parts_of_same': 0.7251461988304094}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8568994889267462, 'recall': 0.8568994889267462, 'f1': 0.8568994889267463, 'support': None}, 'macro_avg': {'precision': 0.7548719871554518, 'recall': 0.740537574840617, 'f1': 0.7474911640495475, 'support': None}, 'weighted_avg': {'precision': 0.8545036165460317, 'recall': 0.8568994889267462, 'f1': 0.8555975083786898, 'support': None}}
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7684e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9494e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2592e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4063e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8633e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9494e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.9111361079865017, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.7380952380952381}, 'recall': {'supports': 0.9236031927023945, 'contradicts': 0.5853658536585366, 'parts_of_same': 0.7126436781609196}, 'f1': {'supports': 0.9173272933182333, 'contradicts': 0.6, 'parts_of_same': 0.7251461988304094}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8568994889267462, 'recall': 0.8568994889267462, 'f1': 0.8568994889267463, 'support': None}, 'macro_avg': {'precision': 0.7548719871554518, 'recall': 0.740537574840617, 'f1': 0.7474911640495475, 'support': None}, 'weighted_avg': {'precision': 0.8545036165460317, 'recall': 0.8568994889267462, 'f1': 0.8555975083786898, 'support': None}}
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4924e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9494e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9920e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5004e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4924e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8545e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5873e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8624e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.9124579124579124, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.7469879518072289}, 'recall': {'supports': 0.9259681093394078, 'contradicts': 0.5901639344262295, 'parts_of_same': 0.7126436781609196}, 'f1': {'supports': 0.9191633691351047, 'contradicts': 0.602510460251046, 'parts_of_same': 0.7294117647058824}, 'support': {'supports': 878, 'contradicts': 122, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8594548551959114, 'recall': 0.8594548551959114, 'f1': 0.8594548551959114, 'support': None}, 'macro_avg': {'precision': 0.758276826549919, 'recall': 0.7429252406421855, 'f1': 0.7503618646973443, 'support': None}, 'weighted_avg': {'precision': 0.8570620731085418, 'recall': 0.8594548551959114, 'f1': 0.8581340385946108, 'support': None}}
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1730e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5873e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8633e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4924e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1730e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4924e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4924e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9494e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.910414333706607, 'contradicts': 0.6120689655172413, 'parts_of_same': 0.7454545454545455}, 'recall': {'supports': 0.9259681093394078, 'contradicts': 0.5819672131147541, 'parts_of_same': 0.7068965517241379}, 'f1': {'supports': 0.9181253529079616, 'contradicts': 0.5966386554621848, 'parts_of_same': 0.7256637168141592}, 'support': {'supports': 878, 'contradicts': 122, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8577512776831345, 'recall': 0.8577512776831345, 'f1': 0.8577512776831345, 'support': None}, 'macro_avg': {'precision': 0.7559792815594646, 'recall': 0.7382772913927665, 'f1': 0.7468092417281018, 'support': None}, 'weighted_avg': {'precision': 0.8549619162662653, 'recall': 0.8577512776831345, 'f1': 0.8561920464610225, 'support': None}}
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5012e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5991e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3018e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3791e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1730e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4924e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8633e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8022e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8624e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0435e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5991e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5012e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8971e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4063e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.9114349775784754, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.7454545454545455}, 'recall': {'supports': 0.9259681093394078, 'contradicts': 0.5901639344262295, 'parts_of_same': 0.7068965517241379}, 'f1': {'supports': 0.9186440677966101, 'contradicts': 0.602510460251046, 'parts_of_same': 0.7256637168141592}, 'support': {'supports': 878, 'contradicts': 122, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.858603066439523, 'recall': 0.858603066439523, 'f1': 0.858603066439523, 'support': None}, 'macro_avg': {'precision': 0.7574247128058788, 'recall': 0.741009531829925, 'f1': 0.7489394149539385, 'support': None}, 'weighted_avg': {'precision': 0.8560697821975429, 'recall': 0.858603066439523, 'f1': 0.857190165589195, 'support': None}}
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0781e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8022e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0869e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6319e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3541e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7161e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7412e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6822e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5991e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5777e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0435e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0435e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8883e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6840e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7500e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4916e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8633e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3219e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9599e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8624e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4402e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7587e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9599e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8110e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7684e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2019e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0730e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2019e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1296e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0435e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5299e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2019e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8883e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8624e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9103139013452914, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.7454545454545455}, 'recall': {'supports': 0.9258836944127709, 'contradicts': 0.5853658536585366, 'parts_of_same': 0.7068965517241379}, 'f1': {'supports': 0.9180327868852459, 'contradicts': 0.6, 'parts_of_same': 0.7256637168141592}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.8577512776831345, 'recall': 0.8577512776831345, 'f1': 0.8577512776831345, 'support': None}, 'macro_avg': {'precision': 0.7570510207281508, 'recall': 0.7393820332651484, 'f1': 0.7478988345664684, 'support': None}, 'weighted_avg': {'precision': 0.8549801448732702, 'recall': 0.8577512776831345, 'f1': 0.8562012272777039, 'support': None}}
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7110e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5991e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3489e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6396e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8545e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5777e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8624e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3489e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2019e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1120e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5299e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8765e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4828e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5029e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0435e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2245e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6319e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4490e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2245e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9869e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5004e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3967e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3489e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1642e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5991e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7110e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5029e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9869e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3219e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6319e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7500e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2679e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6161e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6319e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8920e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6300e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5299e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5796e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4350e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1497e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4055e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0259e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3489e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7110e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9869e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8971e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8920e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3018e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8765e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5991e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9869e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6161e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9494e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9599e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2019e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1304e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3943e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9781e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2810e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2679e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3401e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5991e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.910414333706607, 'contradicts': 0.6206896551724138, 'parts_of_same': 0.7454545454545455}, 'recall': {'supports': 0.927023945267959, 'contradicts': 0.5853658536585366, 'parts_of_same': 0.7068965517241379}, 'f1': {'supports': 0.9186440677966102, 'contradicts': 0.602510460251046, 'parts_of_same': 0.7256637168141592}, 'support': {'supports': 877, 'contradicts': 123, 'parts_of_same': 174}, 'micro_avg': {'precision': 0.858603066439523, 'recall': 0.858603066439523, 'f1': 0.858603066439523, 'support': None}, 'macro_avg': {'precision': 0.7588528447778554, 'recall': 0.7397621168835444, 'f1': 0.7489394149539385, 'support': None}, 'weighted_avg': {'precision': 0.8556109788381534, 'recall': 0.858603066439523, 'f1': 0.8569208865367713, 'support': None}}
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7022e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5299e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7789e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2019e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8624e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7110e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8624e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2019e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3759e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1730e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0869e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5299e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8765e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5351e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1304e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8624e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3759e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5991e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5991e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3943e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5212e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7587e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6928e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5212e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7720e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4924e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7720e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5004e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8832e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1208e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0869e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8624e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7720e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3759e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9920e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5004e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4490e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0435e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8765e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4828e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5004e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8765e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3943e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8241e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4466e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3759e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2245e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3114e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5796e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5004e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8110e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3943e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1949e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0., device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4466e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8765e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4055e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9398e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0., device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8110e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2245e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3106e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3759e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9869e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3879e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3943e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4988e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7720e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4490e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5865e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5299e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4063e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4055e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4168e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2019e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8765e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2019e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6212e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0051e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9310e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1981e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1679e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3943e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0., device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9398e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5796e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4055e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1304e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3106e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6822e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3943e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1497e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5689e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5299e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-08, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 4-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.8518518518518519, 'contradicts': 0.0, 'parts_of_same': 0.16216216216216217}, 'recall': {'supports': 0.028395061728395062, 'contradicts': 0.0, 'parts_of_same': 0.9940828402366864}, 'f1': {'supports': 0.05495818399044206, 'contradicts': 0.0, 'parts_of_same': 0.278838174273859}, 'support': {'supports': 810, 'contradicts': 85, 'parts_of_same': 169}, 'micro_avg': {'precision': 0.17951127819548873, 'recall': 0.17951127819548873, 'f1': 0.17951127819548873, 'support': None}, 'macro_avg': {'precision': 0.33800467133800466, 'recall': 0.3408259673216938, 'f1': 0.11126545275476701, 'support': None}, 'weighted_avg': {'precision': 0.6742532005689901, 'recall': 0.17951127819548873, 'f1': 0.08612761323734985, 'support': None}}
Loss: tensor(1.6988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9471428571428572, 'contradicts': 0.4645669291338583, 'parts_of_same': 0.6033755274261603}, 'recall': {'supports': 0.8195302843016069, 'contradicts': 0.6941176470588235, 'parts_of_same': 0.8411764705882353}, 'f1': {'supports': 0.878727634194831, 'contradicts': 0.5566037735849056, 'parts_of_same': 0.7027027027027026}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8129699248120301, 'recall': 0.8129699248120301, 'f1': 0.8129699248120301, 'support': None}, 'macro_avg': {'precision': 0.6716951045676253, 'recall': 0.7849414673162219, 'f1': 0.7126780368274798, 'support': None}, 'weighted_avg': {'precision': 0.8536659775069518, 'recall': 0.8129699248120301, 'f1': 0.824869770937777, 'support': None}}
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7728, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9568690095846646, 'contradicts': 0.3212669683257919, 'parts_of_same': 0.6451612903225806}, 'recall': {'supports': 0.7404202719406675, 'contradicts': 0.8352941176470589, 'parts_of_same': 0.8235294117647058}, 'f1': {'supports': 0.834843205574913, 'contradicts': 0.4640522875816993, 'parts_of_same': 0.7235142118863048}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.7612781954887218, 'recall': 0.7612781954887218, 'f1': 0.7612781954887218, 'support': None}, 'macro_avg': {'precision': 0.6410990894110123, 'recall': 0.7997479337841441, 'f1': 0.674136568347639, 'support': None}, 'weighted_avg': {'precision': 0.8562896056546283, 'recall': 0.7612781954887218, 'f1': 0.787434223472952, 'support': None}}
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9325068870523416, 'contradicts': 0.46825396825396826, 'parts_of_same': 0.6415094339622641}, 'recall': {'supports': 0.8368355995055624, 'contradicts': 0.6941176470588235, 'parts_of_same': 0.8}, 'f1': {'supports': 0.8820846905537458, 'contradicts': 0.5592417061611376, 'parts_of_same': 0.7120418848167539}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8195488721804511, 'recall': 0.8195488721804511, 'f1': 0.8195488721804511, 'support': None}, 'macro_avg': {'precision': 0.6807567630895246, 'recall': 0.7769844155214619, 'f1': 0.7177894271772124, 'support': None}, 'weighted_avg': {'precision': 0.848925058929057, 'recall': 0.8195488721804511, 'f1': 0.829125169267411, 'support': None}}
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.9428152492668622, 'contradicts': 0.5730337078651685, 'parts_of_same': 0.5187713310580204}, 'recall': {'supports': 0.7948084054388134, 'contradicts': 0.6, 'parts_of_same': 0.8941176470588236}, 'f1': {'supports': 0.8625083836351441, 'contradicts': 0.5862068965517241, 'parts_of_same': 0.6565874730021598}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.7951127819548872, 'recall': 0.7951127819548872, 'f1': 0.7951127819548872, 'support': None}, 'macro_avg': {'precision': 0.6782067627300169, 'recall': 0.7629753508325456, 'f1': 0.7017675843963427, 'support': None}, 'weighted_avg': {'precision': 0.8455230527305398, 'recall': 0.7951127819548872, 'f1': 0.8075345291147513, 'support': None}}
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.9177377892030848, 'contradicts': 0.51, 'parts_of_same': 0.6989247311827957}, 'recall': {'supports': 0.8825710754017305, 'contradicts': 0.6, 'parts_of_same': 0.7647058823529411}, 'f1': {'supports': 0.8998109640831757, 'contradicts': 0.5513513513513514, 'parts_of_same': 0.7303370786516853}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8411654135338346, 'recall': 0.8411654135338346, 'f1': 0.8411654135338346, 'support': None}, 'macro_avg': {'precision': 0.7088875067952936, 'recall': 0.7490923192515572, 'f1': 0.727166464695404, 'support': None}, 'weighted_avg': {'precision': 0.8502040185774163, 'recall': 0.8411654135338346, 'f1': 0.8448959005441171, 'support': None}}
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.926509186351706, 'contradicts': 0.6329113924050633, 'parts_of_same': 0.6278026905829597}, 'recall': {'supports': 0.8726823238566132, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.8235294117647058}, 'f1': {'supports': 0.8987905792488861, 'contradicts': 0.6097560975609757, 'parts_of_same': 0.712468193384224}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8421052631578947, 'recall': 0.8421052631578947, 'f1': 0.8421052631578947, 'support': None}, 'macro_avg': {'precision': 0.729074423113243, 'recall': 0.761482343246322, 'f1': 0.7403382900646953, 'support': None}, 'weighted_avg': {'precision': 0.8553288134511876, 'recall': 0.8421052631578947, 'f1': 0.845930864455216, 'support': None}}
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9277929155313351, 'contradicts': 0.42857142857142855, 'parts_of_same': 0.7}, 'recall': {'supports': 0.8407407407407408, 'contradicts': 0.7058823529411765, 'parts_of_same': 0.7869822485207101}, 'f1': {'supports': 0.8821243523316062, 'contradicts': 0.5333333333333333, 'parts_of_same': 0.7409470752089137}, 'support': {'supports': 810, 'contradicts': 85, 'parts_of_same': 169}, 'micro_avg': {'precision': 0.8214285714285714, 'recall': 0.8214285714285714, 'f1': 0.8214285714285714, 'support': None}, 'macro_avg': {'precision': 0.6854547813675879, 'recall': 0.7778684474008758, 'f1': 0.718801586957951, 'support': None}, 'weighted_avg': {'precision': 0.8517301062114219, 'recall': 0.8214285714285714, 'f1': 0.831836573714512, 'support': None}}
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5776, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.9326145552560647, 'contradicts': 0.5652173913043478, 'parts_of_same': 0.6173913043478261}, 'recall': {'supports': 0.854320987654321, 'contradicts': 0.611764705882353, 'parts_of_same': 0.8402366863905325}, 'f1': {'supports': 0.8917525773195877, 'contradicts': 0.5875706214689267, 'parts_of_same': 0.711779448621554}, 'support': {'supports': 810, 'contradicts': 85, 'parts_of_same': 169}, 'micro_avg': {'precision': 0.8327067669172933, 'recall': 0.8327067669172933, 'f1': 0.8327067669172933, 'support': None}, 'macro_avg': {'precision': 0.7050744169694129, 'recall': 0.7687741266424021, 'f1': 0.7303675491366896, 'support': None}, 'weighted_avg': {'precision': 0.8531958632077675, 'recall': 0.8327067669172933, 'f1': 0.8388663696153829, 'support': None}}
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9308510638297872, 'contradicts': 0.5789473684210527, 'parts_of_same': 0.631336405529954}, 'recall': {'supports': 0.8641975308641975, 'contradicts': 0.6470588235294118, 'parts_of_same': 0.8106508875739645}, 'f1': {'supports': 0.8962868117797695, 'contradicts': 0.6111111111111113, 'parts_of_same': 0.7098445595854922}, 'support': {'supports': 810, 'contradicts': 85, 'parts_of_same': 169}, 'micro_avg': {'precision': 0.8383458646616542, 'recall': 0.8383458646616542, 'f1': 0.8383458646616542, 'support': None}, 'macro_avg': {'precision': 0.713711612593598, 'recall': 0.773969080655858, 'f1': 0.7390808274921242, 'support': None}, 'weighted_avg': {'precision': 0.8551651696921798, 'recall': 0.8383458646616542, 'f1': 0.8438914403721861, 'support': None}}
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9328767123287671, 'contradicts': 0.48333333333333334, 'parts_of_same': 0.6495327102803738}, 'recall': {'supports': 0.8417799752781211, 'contradicts': 0.6823529411764706, 'parts_of_same': 0.8176470588235294}, 'f1': {'supports': 0.8849902534113061, 'contradicts': 0.5658536585365854, 'parts_of_same': 0.7239583333333334}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.825187969924812, 'recall': 0.825187969924812, 'f1': 0.8251879699248119, 'support': None}, 'macro_avg': {'precision': 0.6885809186474914, 'recall': 0.7805933250927071, 'f1': 0.7249340817604083, 'support': None}, 'weighted_avg': {'precision': 0.8516928142433924, 'recall': 0.825187969924812, 'f1': 0.8337665344473901, 'support': None}}
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.912932138284251, 'contradicts': 0.573170731707317, 'parts_of_same': 0.6567164179104478}, 'recall': {'supports': 0.8802469135802469, 'contradicts': 0.5529411764705883, 'parts_of_same': 0.7810650887573964}, 'f1': {'supports': 0.896291640477687, 'contradicts': 0.562874251497006, 'parts_of_same': 0.7135135135135134}, 'support': {'supports': 810, 'contradicts': 85, 'parts_of_same': 169}, 'micro_avg': {'precision': 0.8383458646616542, 'recall': 0.8383458646616542, 'f1': 0.8383458646616542, 'support': None}, 'macro_avg': {'precision': 0.7142730959673386, 'recall': 0.7380843929360772, 'f1': 0.7242264684960688, 'support': None}, 'weighted_avg': {'precision': 0.8450936267220216, 'recall': 0.8383458646616542, 'f1': 0.8406243646127404, 'support': None}}
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(12.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9147582697201018, 'contradicts': 0.6493506493506493, 'parts_of_same': 0.6567164179104478}, 'recall': {'supports': 0.8887515451174289, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.7764705882352941}, 'f1': {'supports': 0.9015673981191222, 'contradicts': 0.6172839506172839, 'parts_of_same': 0.7115902964959568}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8468045112781954, 'recall': 0.8468045112781954, 'f1': 0.8468045112781954, 'support': None}, 'macro_avg': {'precision': 0.7402751123270663, 'recall': 0.7511524758234568, 'f1': 0.7434805484107877, 'support': None}, 'weighted_avg': {'precision': 0.8523271019202479, 'recall': 0.8468045112781954, 'f1': 0.8485033000800298, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(12.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9216944801026957, 'contradicts': 0.6, 'parts_of_same': 0.676923076923077}, 'recall': {'supports': 0.8875154511742892, 'contradicts': 0.6352941176470588, 'parts_of_same': 0.7764705882352941}, 'f1': {'supports': 0.9042821158690175, 'contradicts': 0.6171428571428571, 'parts_of_same': 0.7232876712328767}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.849624060150376, 'recall': 0.849624060150376, 'f1': 0.849624060150376, 'support': None}, 'macro_avg': {'precision': 0.7328725190085909, 'recall': 0.7664267190188806, 'f1': 0.7482375480815838, 'support': None}, 'weighted_avg': {'precision': 0.8568869901127856, 'recall': 0.849624060150376, 'f1': 0.8524250739706458, 'support': None}}
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9298737727910238, 'contradicts': 0.3385416666666667, 'parts_of_same': 0.7610062893081762}, 'recall': {'supports': 0.8195302843016069, 'contradicts': 0.7647058823529411, 'parts_of_same': 0.711764705882353}, 'f1': {'supports': 0.8712220762155058, 'contradicts': 0.4693140794223827, 'parts_of_same': 0.7355623100303952}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.7979323308270677, 'recall': 0.7979323308270677, 'f1': 0.7979323308270677, 'support': None}, 'macro_avg': {'precision': 0.6764739095886222, 'recall': 0.7653336241789671, 'f1': 0.6920328218894278, 'support': None}, 'weighted_avg': {'precision': 0.855653188944544, 'recall': 0.7979323308270677, 'f1': 0.8174398017992612, 'support': None}}
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9279778393351801, 'contradicts': 0.42105263157894735, 'parts_of_same': 0.645933014354067}, 'recall': {'supports': 0.8281829419035847, 'contradicts': 0.6588235294117647, 'parts_of_same': 0.7941176470588235}, 'f1': {'supports': 0.875244937949053, 'contradicts': 0.5137614678899083, 'parts_of_same': 0.712401055408971}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8092105263157895, 'recall': 0.8092105263157895, 'f1': 0.8092105263157895, 'support': None}, 'macro_avg': {'precision': 0.6649878284227314, 'recall': 0.7603747061247242, 'f1': 0.7004691537493107, 'support': None}, 'weighted_avg': {'precision': 0.8424174418670701, 'recall': 0.8092105263157895, 'f1': 0.8203487396531496, 'support': None}}
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9418777943368107, 'contradicts': 0.49523809523809526, 'parts_of_same': 0.5138888888888888}, 'recall': {'supports': 0.7812113720642769, 'contradicts': 0.611764705882353, 'parts_of_same': 0.8705882352941177}, 'f1': {'supports': 0.8540540540540541, 'contradicts': 0.5473684210526316, 'parts_of_same': 0.6462882096069869}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.7819548872180451, 'recall': 0.7819548872180451, 'f1': 0.7819548872180451, 'support': None}, 'macro_avg': {'precision': 0.6503349261545983, 'recall': 0.7545214377469159, 'f1': 0.6825702282378909, 'support': None}, 'weighted_avg': {'precision': 0.8378153052864934, 'recall': 0.7819548872180451, 'f1': 0.7963581213838262, 'support': None}}
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9353507565337001, 'contradicts': 0.4351145038167939, 'parts_of_same': 0.6601941747572816}, 'recall': {'supports': 0.8405438813349815, 'contradicts': 0.6705882352941176, 'parts_of_same': 0.8}, 'f1': {'supports': 0.8854166666666667, 'contradicts': 0.5277777777777778, 'parts_of_same': 0.723404255319149}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8204887218045113, 'recall': 0.8204887218045113, 'f1': 0.8204887218045113, 'support': None}, 'macro_avg': {'precision': 0.6768864783692585, 'recall': 0.7703773722096997, 'f1': 0.7121995665878645, 'support': None}, 'weighted_avg': {'precision': 0.8514252862489932, 'recall': 0.8204887218045113, 'f1': 0.8309604491059208, 'support': None}}
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1444e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.928476821192053, 'contradicts': 0.5813953488372093, 'parts_of_same': 0.6278026905829597}, 'recall': {'supports': 0.8665018541409147, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.8235294117647058}, 'f1': {'supports': 0.8964194373401535, 'contradicts': 0.5847953216374269, 'parts_of_same': 0.712468193384224}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8374060150375939, 'recall': 0.8374060150375939, 'f1': 0.8374060150375939, 'support': None}, 'macro_avg': {'precision': 0.7125582868707406, 'recall': 0.7594221866744225, 'f1': 0.7312276507872681, 'support': None}, 'weighted_avg': {'precision': 0.852709408265636, 'recall': 0.8374060150375939, 'f1': 0.8421339473897402, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.9274406332453826, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.6244343891402715}, 'recall': {'supports': 0.8689740420271941, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.8117647058823529}, 'f1': {'supports': 0.8972559029993619, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.7058823529411764}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8374060150375939, 'recall': 0.8374060150375939, 'f1': 0.8374060150375939, 'support': None}, 'macro_avg': {'precision': 0.7133701055011005, 'recall': 0.7563246806757314, 'f1': 0.7304578500193951, 'support': None}, 'weighted_avg': {'precision': 0.8519298105727074, 'recall': 0.8374060150375939, 'f1': 0.8419925051940638, 'support': None}}
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.9262187088274044, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.6272727272727273}, 'recall': {'supports': 0.8689740420271941, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.8117647058823529}, 'f1': {'supports': 0.8966836734693877, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.7076923076923078}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8374060150375939, 'recall': 0.8374060150375939, 'f1': 0.8374060150375939, 'support': None}, 'macro_avg': {'precision': 0.7139089100725929, 'recall': 0.7563246806757314, 'f1': 0.7308704250931143, 'support': None}, 'weighted_avg': {'precision': 0.8514542284565166, 'recall': 0.8374060150375939, 'f1': 0.8418466016394991, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.9262187088274044, 'contradicts': 0.5813953488372093, 'parts_of_same': 0.6255707762557078}, 'recall': {'supports': 0.8679012345679012, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.8106508875739645}, 'f1': {'supports': 0.8961121733588273, 'contradicts': 0.5847953216374269, 'parts_of_same': 0.7061855670103093}, 'support': {'supports': 810, 'contradicts': 85, 'parts_of_same': 169}, 'micro_avg': {'precision': 0.8364661654135338, 'recall': 0.8364661654135338, 'f1': 0.8364661654135339, 'support': None}, 'macro_avg': {'precision': 0.7110616113067739, 'recall': 0.7555958054198376, 'f1': 0.7290310206688545, 'support': None}, 'weighted_avg': {'precision': 0.8509184398388863, 'recall': 0.8364661654135338, 'f1': 0.8410750221659528, 'support': None}}
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.9262187088274044, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.6272727272727273}, 'recall': {'supports': 0.8689740420271941, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.8117647058823529}, 'f1': {'supports': 0.8966836734693877, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.7076923076923078}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8374060150375939, 'recall': 0.8374060150375939, 'f1': 0.8374060150375939, 'support': None}, 'macro_avg': {'precision': 0.7139089100725929, 'recall': 0.7563246806757314, 'f1': 0.7308704250931143, 'support': None}, 'weighted_avg': {'precision': 0.8514542284565166, 'recall': 0.8374060150375939, 'f1': 0.8418466016394991, 'support': None}}
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6401e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.9262187088274044, 'contradicts': 0.5813953488372093, 'parts_of_same': 0.6301369863013698}, 'recall': {'supports': 0.8689740420271941, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.8117647058823529}, 'f1': {'supports': 0.8966836734693877, 'contradicts': 0.5847953216374269, 'parts_of_same': 0.7095115681233933}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8374060150375939, 'recall': 0.8374060150375939, 'f1': 0.8374060150375939, 'support': None}, 'macro_avg': {'precision': 0.7125836813219945, 'recall': 0.7563246806757314, 'f1': 0.7303301877434026, 'support': None}, 'weighted_avg': {'precision': 0.8513654396275995, 'recall': 0.8374060150375939, 'f1': 0.8418624631173806, 'support': None}}
Loss: tensor(8.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.9277266754270697, 'contradicts': 0.5813953488372093, 'parts_of_same': 0.6359447004608295}, 'recall': {'supports': 0.8716049382716049, 'contradicts': 0.5952380952380952, 'parts_of_same': 0.8117647058823529}, 'f1': {'supports': 0.8987905792488861, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.7131782945736435}, 'support': {'supports': 810, 'contradicts': 84, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8402255639097744, 'recall': 0.8402255639097744, 'f1': 0.8402255639097744, 'support': None}, 'macro_avg': {'precision': 0.7150222415750362, 'recall': 0.7595359131306845, 'f1': 0.7334013893133923, 'support': None}, 'weighted_avg': {'precision': 0.8537654280795047, 'recall': 0.8402255639097744, 'f1': 0.8446169586231197, 'support': None}}
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5519e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.926412614980289, 'contradicts': 0.5813953488372093, 'parts_of_same': 0.6359447004608295}, 'recall': {'supports': 0.8714462299134734, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.8117647058823529}, 'f1': {'supports': 0.8980891719745223, 'contradicts': 0.5847953216374269, 'parts_of_same': 0.7131782945736435}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8392857142857143, 'recall': 0.8392857142857143, 'f1': 0.8392857142857143, 'support': None}, 'macro_avg': {'precision': 0.7145842214261093, 'recall': 0.7571487433044911, 'f1': 0.7320209293951976, 'support': None}, 'weighted_avg': {'precision': 0.8524407981659377, 'recall': 0.8392857142857143, 'f1': 0.8435169666767757, 'support': None}}
Loss: tensor(3.1737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1018e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.926605504587156, 'contradicts': 0.5813953488372093, 'parts_of_same': 0.641860465116279}, 'recall': {'supports': 0.8739184177997528, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.8117647058823529}, 'f1': {'supports': 0.8994910941475827, 'contradicts': 0.5847953216374269, 'parts_of_same': 0.716883116883117}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8411654135338346, 'recall': 0.8411654135338346, 'f1': 0.8411654135338346, 'support': None}, 'macro_avg': {'precision': 0.7166204395135481, 'recall': 0.757972805933251, 'f1': 0.7337231775560422, 'support': None}, 'weighted_avg': {'precision': 0.8535326474924243, 'recall': 0.8411654135338346, 'f1': 0.8451748377581819, 'support': None}}
Loss: tensor(3.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6718e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.9267015706806283, 'contradicts': 0.5813953488372093, 'parts_of_same': 0.6448598130841121}, 'recall': {'supports': 0.8751545117428925, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.8117647058823529}, 'f1': {'supports': 0.9001907183725366, 'contradicts': 0.5847953216374269, 'parts_of_same': 0.71875}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8421052631578947, 'recall': 0.8421052631578947, 'f1': 0.8421052631578947, 'support': None}, 'macro_avg': {'precision': 0.7176522442006498, 'recall': 0.7583848372476307, 'f1': 0.7345786800033212, 'support': None}, 'weighted_avg': {'precision': 0.8540849093572276, 'recall': 0.8421052631578947, 'f1': 0.8460050690813566, 'support': None}}
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9267015706806283, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.641860465116279}, 'recall': {'supports': 0.8751545117428925, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.8117647058823529}, 'f1': {'supports': 0.9001907183725366, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.716883116883117}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8421052631578947, 'recall': 0.8421052631578947, 'f1': 0.8421052631578947, 'support': None}, 'macro_avg': {'precision': 0.7189324433048515, 'recall': 0.7583848372476307, 'f1': 0.7351030431244335, 'support': None}, 'weighted_avg': {'precision': 0.8541521144270636, 'recall': 0.8421052631578947, 'f1': 0.8459815987157068, 'support': None}}
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.926605504587156, 'contradicts': 0.5813953488372093, 'parts_of_same': 0.641860465116279}, 'recall': {'supports': 0.8739184177997528, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.8117647058823529}, 'f1': {'supports': 0.8994910941475827, 'contradicts': 0.5847953216374269, 'parts_of_same': 0.716883116883117}, 'support': {'supports': 809, 'contradicts': 85, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8411654135338346, 'recall': 0.8411654135338346, 'f1': 0.8411654135338346, 'support': None}, 'macro_avg': {'precision': 0.7166204395135481, 'recall': 0.757972805933251, 'f1': 0.7337231775560422, 'support': None}, 'weighted_avg': {'precision': 0.8535326474924243, 'recall': 0.8411654135338346, 'f1': 0.8451748377581819, 'support': None}}
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 5-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.6989374262101535, 'contradicts': 0.0, 'parts_of_same': 0.1842818428184282}, 'recall': {'supports': 0.6788990825688074, 'contradicts': 0.0, 'parts_of_same': 0.28936170212765955}, 'f1': {'supports': 0.6887725421756835, 'contradicts': 0.0, 'parts_of_same': 0.2251655629139073}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.5427631578947368, 'recall': 0.5427631578947368, 'f1': 0.5427631578947368, 'support': None}, 'macro_avg': {'precision': 0.29440642300952724, 'recall': 0.3227535948988223, 'f1': 0.3046460350298636, 'support': None}, 'weighted_avg': {'precision': 0.5368253854585399, 'recall': 0.5427631578947368, 'f1': 0.5374371414983259, 'support': None}}
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9584487534626038, 'contradicts': 0.5877862595419847, 'parts_of_same': 0.6088154269972452}, 'recall': {'supports': 0.7935779816513762, 'contradicts': 0.7064220183486238, 'parts_of_same': 0.9404255319148936}, 'f1': {'supports': 0.8682559598494354, 'contradicts': 0.6416666666666666, 'parts_of_same': 0.7391304347826089}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8141447368421053, 'recall': 0.8141447368421053, 'f1': 0.8141447368421053, 'support': None}, 'macro_avg': {'precision': 0.7183501466672779, 'recall': 0.8134751773049645, 'f1': 0.749684353766237, 'support': None}, 'weighted_avg': {'precision': 0.8576543097482068, 'recall': 0.8141447368421053, 'f1': 0.822990555780664, 'support': None}}
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5493, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9842105263157894, 'contradicts': 0.32, 'parts_of_same': 0.6358381502890174}, 'recall': {'supports': 0.643348623853211, 'contradicts': 0.8807339449541285, 'parts_of_same': 0.9361702127659575}, 'f1': {'supports': 0.7780859916782246, 'contradicts': 0.46943765281173594, 'parts_of_same': 0.7573149741824441}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.7212171052631579, 'recall': 0.7212171052631579, 'f1': 0.7212171052631579, 'support': None}, 'macro_avg': {'precision': 0.6466828922016022, 'recall': 0.8200842605244323, 'f1': 0.6682795395574681, 'support': None}, 'weighted_avg': {'precision': 0.8573466646918483, 'recall': 0.7212171052631579, 'f1': 0.7464051873624714, 'support': None}}
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9352869352869353, 'contradicts': 0.5294117647058824, 'parts_of_same': 0.7991803278688525}, 'recall': {'supports': 0.8774341351660939, 'contradicts': 0.7431192660550459, 'parts_of_same': 0.8333333333333334}, 'f1': {'supports': 0.905437352245863, 'contradicts': 0.6183206106870228, 'parts_of_same': 0.8158995815899582}, 'support': {'supports': 873, 'contradicts': 109, 'parts_of_same': 234}, 'micro_avg': {'precision': 0.8569078947368421, 'recall': 0.8569078947368421, 'f1': 0.8569078947368421, 'support': None}, 'macro_avg': {'precision': 0.7546263426205568, 'recall': 0.817962244851491, 'f1': 0.7798858481742813, 'support': None}, 'weighted_avg': {'precision': 0.8727134651149238, 'recall': 0.8569078947368421, 'f1': 0.8624706062233338, 'support': None}}
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.9653179190751445, 'contradicts': 0.4052863436123348, 'parts_of_same': 0.6936026936026936}, 'recall': {'supports': 0.7660550458715596, 'contradicts': 0.8440366972477065, 'parts_of_same': 0.8765957446808511}, 'f1': {'supports': 0.8542199488491048, 'contradicts': 0.5476190476190476, 'parts_of_same': 0.7744360902255639}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.7944078947368421, 'recall': 0.7944078947368421, 'f1': 0.7944078947368421, 'support': None}, 'macro_avg': {'precision': 0.6880689854300576, 'recall': 0.8288958292667057, 'f1': 0.7254250288979054, 'support': None}, 'weighted_avg': {'precision': 0.8626069653650523, 'recall': 0.7944078947368421, 'f1': 0.8113180532811702, 'support': None}}
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.9482535575679172, 'contradicts': 0.457286432160804, 'parts_of_same': 0.8237704918032787}, 'recall': {'supports': 0.8405963302752294, 'contradicts': 0.8348623853211009, 'parts_of_same': 0.8553191489361702}, 'f1': {'supports': 0.8911854103343466, 'contradicts': 0.5909090909090909, 'parts_of_same': 0.8392484342379958}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8429276315789473, 'recall': 0.8429276315789473, 'f1': 0.8429276315789473, 'support': None}, 'macro_avg': {'precision': 0.743103493844, 'recall': 0.8435926215108335, 'f1': 0.7737809784938111, 'support': None}, 'weighted_avg': {'precision': 0.8801869974329951, 'recall': 0.8429276315789473, 'f1': 0.854232031880403, 'support': None}}
Loss: tensor(6.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9335664335664335, 'contradicts': 0.7701149425287356, 'parts_of_same': 0.7822878228782287}, 'recall': {'supports': 0.9185779816513762, 'contradicts': 0.6146788990825688, 'parts_of_same': 0.902127659574468}, 'f1': {'supports': 0.9260115606936417, 'contradicts': 0.6836734693877551, 'parts_of_same': 0.8379446640316204}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8881578947368421, 'recall': 0.8881578947368421, 'f1': 0.8881578947368421, 'support': None}, 'macro_avg': {'precision': 0.8286563996577994, 'recall': 0.811794846769471, 'f1': 0.815876564704339, 'support': None}, 'weighted_avg': {'precision': 0.8896793562351529, 'recall': 0.8881578947368421, 'f1': 0.8872693134338419, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9223638470451911, 'contradicts': 0.7126436781609196, 'parts_of_same': 0.7669172932330827}, 'recall': {'supports': 0.9117983963344788, 'contradicts': 0.5688073394495413, 'parts_of_same': 0.8717948717948718}, 'f1': {'supports': 0.9170506912442397, 'contradicts': 0.6326530612244898, 'parts_of_same': 0.8160000000000001}, 'support': {'supports': 873, 'contradicts': 109, 'parts_of_same': 234}, 'micro_avg': {'precision': 0.8733552631578947, 'recall': 0.8733552631578947, 'f1': 0.8733552631578947, 'support': None}, 'macro_avg': {'precision': 0.8006416061463978, 'recall': 0.7841335358596306, 'f1': 0.7885679174895767, 'support': None}, 'weighted_avg': {'precision': 0.8736516825711624, 'recall': 0.8733552631578947, 'f1': 0.8721122015869167, 'support': None}}
Loss: tensor(6.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.9254437869822485, 'contradicts': 0.75, 'parts_of_same': 0.7050847457627119}, 'recall': {'supports': 0.8967889908256881, 'contradicts': 0.5229357798165137, 'parts_of_same': 0.8851063829787233}, 'f1': {'supports': 0.9108910891089109, 'contradicts': 0.6162162162162163, 'parts_of_same': 0.7849056603773584}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8610197368421053, 'recall': 0.8610197368421053, 'f1': 0.8610197368421053, 'support': None}, 'macro_avg': {'precision': 0.7935095109149867, 'recall': 0.768277051206975, 'f1': 0.7706709885674953, 'support': None}, 'weighted_avg': {'precision': 0.8671314946568733, 'recall': 0.8610197368421053, 'f1': 0.8601294633710668, 'support': None}}
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9570469798657718, 'contradicts': 0.538961038961039, 'parts_of_same': 0.6750788643533123}, 'recall': {'supports': 0.8176605504587156, 'contradicts': 0.7614678899082569, 'parts_of_same': 0.9106382978723404}, 'f1': {'supports': 0.8818800247371675, 'contradicts': 0.6311787072243346, 'parts_of_same': 0.7753623188405798}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8305921052631579, 'recall': 0.8305921052631579, 'f1': 0.8305921052631579, 'support': None}, 'macro_avg': {'precision': 0.7236956277267077, 'recall': 0.8299222460797709, 'f1': 0.7628070169340274, 'support': None}, 'weighted_avg': {'precision': 0.8650783329052094, 'recall': 0.8305921052631579, 'f1': 0.8388223730146372, 'support': None}}
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9354037267080745, 'contradicts': 0.5514705882352942, 'parts_of_same': 0.7163636363636363}, 'recall': {'supports': 0.8625429553264605, 'contradicts': 0.6944444444444444, 'parts_of_same': 0.8382978723404255}, 'f1': {'supports': 0.8974970202622169, 'contradicts': 0.6147540983606558, 'parts_of_same': 0.7725490196078432}, 'support': {'supports': 873, 'contradicts': 108, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8429276315789473, 'recall': 0.8429276315789473, 'f1': 0.8429276315789473, 'support': None}, 'macro_avg': {'precision': 0.7344126504356683, 'recall': 0.7984284240371101, 'f1': 0.7616000460769053, 'support': None}, 'weighted_avg': {'precision': 0.8589734633972166, 'recall': 0.8429276315789473, 'f1': 0.8482379612826557, 'support': None}}
Loss: tensor(4.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9349693251533743, 'contradicts': 0.6666666666666666, 'parts_of_same': 0.6815286624203821}, 'recall': {'supports': 0.8738532110091743, 'contradicts': 0.5321100917431193, 'parts_of_same': 0.9106382978723404}, 'f1': {'supports': 0.9033787788974511, 'contradicts': 0.5918367346938775, 'parts_of_same': 0.7795992714025501}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.850328947368421, 'recall': 0.850328947368421, 'f1': 0.850328947368421, 'support': None}, 'macro_avg': {'precision': 0.7610548847468076, 'recall': 0.7722005335415446, 'f1': 0.7582715949979596, 'support': None}, 'weighted_avg': {'precision': 0.8619400936424332, 'recall': 0.850328947368421, 'f1': 0.8515315197860275, 'support': None}}
Loss: tensor(6.7235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(10.4731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9301775147928995, 'contradicts': 0.6759259259259259, 'parts_of_same': 0.7718631178707225}, 'recall': {'supports': 0.9013761467889908, 'contradicts': 0.6697247706422018, 'parts_of_same': 0.8638297872340426}, 'f1': {'supports': 0.9155503785672685, 'contradicts': 0.6728110599078341, 'parts_of_same': 0.8152610441767069}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8733552631578947, 'recall': 0.8733552631578947, 'f1': 0.8733552631578947, 'support': None}, 'macro_avg': {'precision': 0.7926555195298493, 'recall': 0.811643568221745, 'f1': 0.8012074942172699, 'support': None}, 'weighted_avg': {'precision': 0.8767915719777584, 'recall': 0.8733552631578947, 'f1': 0.8744100995247847, 'support': None}}
Loss: tensor(6.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9247311827956989, 'contradicts': 0.6302521008403361, 'parts_of_same': 0.7538461538461538}, 'recall': {'supports': 0.8876146788990825, 'contradicts': 0.6880733944954128, 'parts_of_same': 0.8340425531914893}, 'f1': {'supports': 0.9057928613224108, 'contradicts': 0.6578947368421052, 'parts_of_same': 0.7919191919191919}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.859375, 'recall': 0.859375, 'f1': 0.859375, 'support': None}, 'macro_avg': {'precision': 0.769609812494063, 'recall': 0.8032435421953282, 'f1': 0.7852022633612359, 'support': None}, 'weighted_avg': {'precision': 0.8653099642625758, 'recall': 0.859375, 'f1': 0.8615648943173863, 'support': None}}
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9294947121034077, 'contradicts': 0.6666666666666666, 'parts_of_same': 0.7782258064516129}, 'recall': {'supports': 0.9060710194730813, 'contradicts': 0.7155963302752294, 'parts_of_same': 0.8247863247863247}, 'f1': {'supports': 0.9176334106728538, 'contradicts': 0.6902654867256638, 'parts_of_same': 0.8008298755186722}, 'support': {'supports': 873, 'contradicts': 109, 'parts_of_same': 234}, 'micro_avg': {'precision': 0.8733552631578947, 'recall': 0.8733552631578947, 'f1': 0.8733552631578947, 'support': None}, 'macro_avg': {'precision': 0.7914623950738958, 'recall': 0.8154845581782117, 'f1': 0.8029095909723966, 'support': None}, 'weighted_avg': {'precision': 0.8768259778311012, 'recall': 0.8733552631578947, 'f1': 0.8747755727317994, 'support': None}}
Loss: tensor(6.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9347037484885127, 'contradicts': 0.626984126984127, 'parts_of_same': 0.7566539923954373}, 'recall': {'supports': 0.8864678899082569, 'contradicts': 0.7247706422018348, 'parts_of_same': 0.8468085106382979}, 'f1': {'supports': 0.9099470276633314, 'contradicts': 0.672340425531915, 'parts_of_same': 0.7991967871485944}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8643092105263158, 'recall': 0.8643092105263158, 'f1': 0.8643092105263158, 'support': None}, 'macro_avg': {'precision': 0.7727806226226924, 'recall': 0.8193490142494632, 'f1': 0.7938280801146136, 'support': None}, 'weighted_avg': {'precision': 0.8727110417238327, 'recall': 0.8643092105263158, 'f1': 0.8672451969451672, 'support': None}}
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7265, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9301470588235294, 'contradicts': 0.5214723926380368, 'parts_of_same': 0.7637130801687764}, 'recall': {'supports': 0.8704128440366973, 'contradicts': 0.7798165137614679, 'parts_of_same': 0.7702127659574468}, 'f1': {'supports': 0.8992890995260664, 'contradicts': 0.625, 'parts_of_same': 0.7669491525423728}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8429276315789473, 'recall': 0.8429276315789473, 'f1': 0.8429276315789473, 'support': None}, 'macro_avg': {'precision': 0.7384441772101141, 'recall': 0.8068140412518706, 'f1': 0.7637460840228131, 'support': None}, 'weighted_avg': {'precision': 0.8613497532329987, 'recall': 0.8429276315789473, 'f1': 0.8491267645017989, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9262782401902497, 'contradicts': 0.7011494252873564, 'parts_of_same': 0.7118055555555556}, 'recall': {'supports': 0.8923253150057274, 'contradicts': 0.5596330275229358, 'parts_of_same': 0.8760683760683761}, 'f1': {'supports': 0.9089848308051343, 'contradicts': 0.6224489795918366, 'parts_of_same': 0.78544061302682}, 'support': {'supports': 873, 'contradicts': 109, 'parts_of_same': 234}, 'micro_avg': {'precision': 0.859375, 'recall': 0.859375, 'f1': 0.859375, 'support': None}, 'macro_avg': {'precision': 0.7797444070110539, 'recall': 0.7760089061990131, 'f1': 0.772291474474597, 'support': None}, 'weighted_avg': {'precision': 0.8648262261861923, 'recall': 0.859375, 'f1': 0.8595261509183129, 'support': None}}
Loss: tensor(8.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.9255989911727617, 'contradicts': 0.5586206896551724, 'parts_of_same': 0.6870503597122302}, 'recall': {'supports': 0.841743119266055, 'contradicts': 0.7431192660550459, 'parts_of_same': 0.8127659574468085}, 'f1': {'supports': 0.8816816816816817, 'contradicts': 0.6377952755905512, 'parts_of_same': 0.7446393762183235}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8273026315789473, 'recall': 0.8273026315789473, 'f1': 0.8273026315789473, 'support': None}, 'macro_avg': {'precision': 0.7237566801800547, 'recall': 0.7992094475893031, 'f1': 0.7547054444968522, 'support': None}, 'weighted_avg': {'precision': 0.8466026398087468, 'recall': 0.8273026315789473, 'f1': 0.8333358263791962, 'support': None}}
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.9230769230769231, 'contradicts': 0.6050420168067226, 'parts_of_same': 0.7358490566037735}, 'recall': {'supports': 0.8797250859106529, 'contradicts': 0.6605504587155964, 'parts_of_same': 0.8333333333333334}, 'f1': {'supports': 0.9008797653958944, 'contradicts': 0.6315789473684209, 'parts_of_same': 0.781563126252505}, 'support': {'supports': 873, 'contradicts': 109, 'parts_of_same': 234}, 'micro_avg': {'precision': 0.8511513157894737, 'recall': 0.8511513157894737, 'f1': 0.8511513157894737, 'support': None}, 'macro_avg': {'precision': 0.7546559988291398, 'recall': 0.791202959319861, 'f1': 0.7713406130056067, 'support': None}, 'weighted_avg': {'precision': 0.8585398132593501, 'recall': 0.8511513157894737, 'f1': 0.8537795328921545, 'support': None}}
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.9330900243309003, 'contradicts': 0.608, 'parts_of_same': 0.758364312267658}, 'recall': {'supports': 0.8795871559633027, 'contradicts': 0.6972477064220184, 'parts_of_same': 0.8680851063829788}, 'f1': {'supports': 0.9055489964580874, 'contradicts': 0.6495726495726496, 'parts_of_same': 0.8095238095238094}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8610197368421053, 'recall': 0.8610197368421053, 'f1': 0.8610197368421053, 'support': None}, 'macro_avg': {'precision': 0.766484778866186, 'recall': 0.8149733229227666, 'f1': 0.7882151518515155, 'support': None}, 'weighted_avg': {'precision': 0.8701826600324379, 'recall': 0.8610197368421053, 'f1': 0.8640462491389524, 'support': None}}
Loss: tensor(7.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.9008908685968819, 'contradicts': 0.7160493827160493, 'parts_of_same': 0.7848101265822784}, 'recall': {'supports': 0.9277522935779816, 'contradicts': 0.5321100917431193, 'parts_of_same': 0.7914893617021277}, 'f1': {'supports': 0.9141242937853108, 'contradicts': 0.6105263157894737, 'parts_of_same': 0.7881355932203389}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.865953947368421, 'recall': 0.865953947368421, 'f1': 0.865953947368421, 'support': None}, 'macro_avg': {'precision': 0.8005834592984034, 'recall': 0.7504505823410762, 'f1': 0.7709287342650412, 'support': None}, 'weighted_avg': {'precision': 0.8618886512165838, 'recall': 0.865953947368421, 'f1': 0.8625621850399863, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.9305373525557011, 'contradicts': 0.4293193717277487, 'parts_of_same': 0.7519083969465649}, 'recall': {'supports': 0.8132875143184422, 'contradicts': 0.7522935779816514, 'parts_of_same': 0.8418803418803419}, 'f1': {'supports': 0.8679706601466992, 'contradicts': 0.5466666666666667, 'parts_of_same': 0.7943548387096774}, 'support': {'supports': 873, 'contradicts': 109, 'parts_of_same': 234}, 'micro_avg': {'precision': 0.8133223684210527, 'recall': 0.8133223684210527, 'f1': 0.8133223684210527, 'support': None}, 'macro_avg': {'precision': 0.7039217070766716, 'recall': 0.8024871447268119, 'f1': 0.7363307218410146, 'support': None}, 'weighted_avg': {'precision': 0.8512347740007795, 'recall': 0.8133223684210527, 'f1': 0.825003359566447, 'support': None}}
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.9215686274509803, 'contradicts': 0.6697247706422018, 'parts_of_same': 0.8083333333333333}, 'recall': {'supports': 0.9162844036697247, 'contradicts': 0.6697247706422018, 'parts_of_same': 0.825531914893617}, 'f1': {'supports': 0.9189189189189189, 'contradicts': 0.6697247706422018, 'parts_of_same': 0.816842105263158}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8766447368421053, 'recall': 0.8766447368421053, 'f1': 0.8766447368421053, 'support': None}, 'macro_avg': {'precision': 0.7998755771421718, 'recall': 0.8038470297351812, 'f1': 0.8018285982747596, 'support': None}, 'weighted_avg': {'precision': 0.8771103424922599, 'recall': 0.8766447368421053, 'f1': 0.8768545987122857, 'support': None}}
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.9394673123486683, 'contradicts': 0.5985401459854015, 'parts_of_same': 0.7905138339920948}, 'recall': {'supports': 0.8888888888888888, 'contradicts': 0.7592592592592593, 'parts_of_same': 0.851063829787234}, 'f1': {'supports': 0.9134785167745733, 'contradicts': 0.6693877551020408, 'parts_of_same': 0.819672131147541}, 'support': {'supports': 873, 'contradicts': 108, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8700657894736842, 'recall': 0.8700657894736842, 'f1': 0.8700657894736842, 'support': None}, 'macro_avg': {'precision': 0.7761737641087215, 'recall': 0.8330706593117941, 'f1': 0.8008461343413851, 'support': None}, 'weighted_avg': {'precision': 0.8804013572655865, 'recall': 0.8700657894736842, 'f1': 0.8736707019036966, 'support': None}}
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.9044368600682594, 'contradicts': 0.625, 'parts_of_same': 0.8}, 'recall': {'supports': 0.9106529209621993, 'contradicts': 0.6481481481481481, 'parts_of_same': 0.7659574468085106}, 'f1': {'supports': 0.9075342465753424, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.7826086956521738}, 'support': {'supports': 873, 'contradicts': 108, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.859375, 'recall': 0.859375, 'f1': 0.859375, 'support': None}, 'macro_avg': {'precision': 0.7764789533560865, 'recall': 0.774919505306286, 'f1': 0.7755021928637175, 'support': None}, 'weighted_avg': {'precision': 0.8594353444404528, 'recall': 0.859375, 'f1': 0.8593073301528023, 'support': None}}
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.9440298507462687, 'contradicts': 0.6470588235294118, 'parts_of_same': 0.7133105802047781}, 'recall': {'supports': 0.8704128440366973, 'contradicts': 0.7064220183486238, 'parts_of_same': 0.8893617021276595}, 'f1': {'supports': 0.905727923627685, 'contradicts': 0.6754385964912281, 'parts_of_same': 0.7916666666666667}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.859375, 'recall': 0.859375, 'f1': 0.859375, 'support': None}, 'macro_avg': {'precision': 0.7681330848268195, 'recall': 0.822065521504327, 'f1': 0.7909443955951933, 'support': None}, 'weighted_avg': {'precision': 0.8728218979963609, 'recall': 0.859375, 'f1': 0.8630421242496314, 'support': None}}
Loss: tensor(3.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.9299754299754299, 'contradicts': 0.5932203389830508, 'parts_of_same': 0.7077464788732394}, 'recall': {'supports': 0.8671248568155785, 'contradicts': 0.6422018348623854, 'parts_of_same': 0.8589743589743589}, 'f1': {'supports': 0.8974510966212211, 'contradicts': 0.6167400881057269, 'parts_of_same': 0.776061776061776}, 'support': {'supports': 873, 'contradicts': 109, 'parts_of_same': 234}, 'micro_avg': {'precision': 0.8453947368421053, 'recall': 0.8453947368421053, 'f1': 0.8453947368421053, 'support': None}, 'macro_avg': {'precision': 0.7436474159439067, 'recall': 0.7894336835507744, 'f1': 0.7634176535962413, 'support': None}, 'weighted_avg': {'precision': 0.8570248711957573, 'recall': 0.8453947368421053, 'f1': 0.8489292208489357, 'support': None}}
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9324324324324325, 'contradicts': 0.6052631578947368, 'parts_of_same': 0.7083333333333334}, 'recall': {'supports': 0.8694158075601375, 'contradicts': 0.6330275229357798, 'parts_of_same': 0.8717948717948718}, 'f1': {'supports': 0.8998221695317131, 'contradicts': 0.6188340807174889, 'parts_of_same': 0.7816091954022988}, 'support': {'supports': 873, 'contradicts': 109, 'parts_of_same': 234}, 'micro_avg': {'precision': 0.8486842105263158, 'recall': 0.8486842105263158, 'f1': 0.8486842105263158, 'support': None}, 'macro_avg': {'precision': 0.7486763078868343, 'recall': 0.7914127340969297, 'f1': 0.7667551485505003, 'support': None}, 'weighted_avg': {'precision': 0.8599812481283223, 'recall': 0.8486842105263158, 'f1': 0.8518866945094817, 'support': None}}
Loss: tensor(8.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.9198998748435544, 'contradicts': 0.4962962962962963, 'parts_of_same': 0.6843971631205674}, 'recall': {'supports': 0.8428899082568807, 'contradicts': 0.6146788990825688, 'parts_of_same': 0.8212765957446808}, 'f1': {'supports': 0.8797127468581687, 'contradicts': 0.5491803278688524, 'parts_of_same': 0.746615087040619}, 'support': {'supports': 872, 'contradicts': 109, 'parts_of_same': 235}, 'micro_avg': {'precision': 0.8182565789473685, 'recall': 0.8182565789473685, 'f1': 0.8182565789473685, 'support': None}, 'macro_avg': {'precision': 0.7001977780868062, 'recall': 0.7596151343613767, 'f1': 0.72516938725588, 'support': None}, 'weighted_avg': {'precision': 0.8364163819845469, 'recall': 0.8182565789473685, 'f1': 0.8243624312932347, 'support': None}}
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Train size: 50 Test size: 50
	Tokenizer: allenai/longformer-base-4096 Model: allenai/longformer-base-4096


		-------------RUN 1-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.0, 'contradicts': 0.0, 'parts_of_same': 0.1517216642754663}, 'recall': {'supports': 0.0, 'contradicts': 0.0, 'parts_of_same': 1.0}, 'f1': {'supports': 0.0, 'contradicts': 0.0, 'parts_of_same': 0.2634693241980691}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.1517216642754663, 'recall': 0.1517216642754663, 'f1': 0.1517216642754663, 'support': None}, 'macro_avg': {'precision': 0.050573888091822096, 'recall': 0.3333333333333333, 'f1': 0.08782310806602305, 'support': None}, 'weighted_avg': {'precision': 0.023019463410517305, 'recall': 0.1517216642754663, 'f1': 0.039974004352863426, 'support': None}}
Loss: tensor(0.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9516819571865444, 'contradicts': 0.2925824175824176, 'parts_of_same': 0.7270588235294118}, 'recall': {'supports': 0.731203007518797, 'contradicts': 0.8987341772151899, 'parts_of_same': 0.7304964539007093}, 'f1': {'supports': 0.826999734254584, 'contradicts': 0.44145077720207254, 'parts_of_same': 0.7287735849056604}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.7453371592539455, 'recall': 0.7453371592539455, 'f1': 0.7453371592539455, 'support': None}, 'macro_avg': {'precision': 0.6571077327661246, 'recall': 0.786811212878232, 'f1': 0.6657413654541057, 'support': None}, 'weighted_avg': {'precision': 0.8615735725297491, 'recall': 0.7453371592539455, 'f1': 0.7793222722760905, 'support': None}}
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9858757062146892, 'contradicts': 0.2883263009845288, 'parts_of_same': 0.38817733990147785}, 'recall': {'supports': 0.49201127819548873, 'contradicts': 0.8649789029535865, 'parts_of_same': 0.9314420803782506}, 'f1': {'supports': 0.6564263322884012, 'contradicts': 0.43248945147679324, 'parts_of_same': 0.5479833101529903}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.5903873744619799, 'recall': 0.5903873744619799, 'f1': 0.5903873744619799, 'support': None}, 'macro_avg': {'precision': 0.5541264490335652, 'recall': 0.7628107538424419, 'f1': 0.5456330313060616, 'support': None}, 'weighted_avg': {'precision': 0.835895211957144, 'recall': 0.5903873744619799, 'f1': 0.6209369351881036, 'support': None}}
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9403217436429684, 'contradicts': 0.44871794871794873, 'parts_of_same': 0.7006369426751592}, 'recall': {'supports': 0.8515037593984962, 'contradicts': 0.7383966244725738, 'parts_of_same': 0.7801418439716312}, 'f1': {'supports': 0.893711467324291, 'contradicts': 0.5582137161084529, 'parts_of_same': 0.738255033557047}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8310616929698709, 'recall': 0.8310616929698709, 'f1': 0.8310616929698708, 'support': None}, 'macro_avg': {'precision': 0.6965588783453588, 'recall': 0.7900140759475671, 'f1': 0.7300600723299303, 'support': None}, 'weighted_avg': {'precision': 0.8621665176004244, 'recall': 0.8310616929698709, 'f1': 0.8416056428903965, 'support': None}}
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.933933933933934, 'contradicts': 0.5283018867924528, 'parts_of_same': 0.7161016949152542}, 'recall': {'supports': 0.8768796992481203, 'contradicts': 0.7088607594936709, 'parts_of_same': 0.7990543735224587}, 'f1': {'supports': 0.9045079980610761, 'contradicts': 0.6054054054054053, 'parts_of_same': 0.7553072625698324}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8507890961262554, 'recall': 0.8507890961262554, 'f1': 0.8507890961262554, 'support': None}, 'macro_avg': {'precision': 0.7261125052138803, 'recall': 0.7949316107547499, 'f1': 0.755073555345438, 'support': None}, 'weighted_avg': {'precision': 0.8664024302476241, 'recall': 0.8507890961262554, 'f1': 0.856445148142787, 'support': None}}
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.9509911894273128, 'contradicts': 0.3771760154738878, 'parts_of_same': 0.7604395604395604}, 'recall': {'supports': 0.8115601503759399, 'contradicts': 0.8227848101265823, 'parts_of_same': 0.817966903073286}, 'f1': {'supports': 0.8757606490872211, 'contradicts': 0.5172413793103449, 'parts_of_same': 0.7881548974943052}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8134863701578192, 'recall': 0.8134863701578192, 'f1': 0.8134863701578192, 'support': None}, 'macro_avg': {'precision': 0.696202255113587, 'recall': 0.8174372878586027, 'f1': 0.7270523086306238, 'support': None}, 'weighted_avg': {'precision': 0.8733019730396581, 'recall': 0.8134863701578192, 'f1': 0.8319922488501612, 'support': None}}
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9593356242840779, 'contradicts': 0.425531914893617, 'parts_of_same': 0.6042003231017771}, 'recall': {'supports': 0.787124060150376, 'contradicts': 0.759493670886076, 'parts_of_same': 0.8841607565011821}, 'f1': {'supports': 0.8647392875580795, 'contradicts': 0.5454545454545455, 'parts_of_same': 0.7178502879078695}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.7994978479196556, 'recall': 0.7994978479196556, 'f1': 0.7994978479196556, 'support': None}, 'macro_avg': {'precision': 0.6630226207598241, 'recall': 0.810259495845878, 'f1': 0.7093480403068315, 'support': None}, 'weighted_avg': {'precision': 0.8600767607526386, 'recall': 0.7994978479196556, 'f1': 0.8153115505671984, 'support': None}}
Loss: tensor(6.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9254864736592311, 'contradicts': 0.5478547854785478, 'parts_of_same': 0.828042328042328}, 'recall': {'supports': 0.9163533834586466, 'contradicts': 0.70042194092827, 'parts_of_same': 0.7399527186761229}, 'f1': {'supports': 0.920897284533648, 'contradicts': 0.6148148148148147, 'parts_of_same': 0.7815230961298377}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8712338593974175, 'recall': 0.8712338593974175, 'f1': 0.8712338593974175, 'support': None}, 'macro_avg': {'precision': 0.7671278623933689, 'recall': 0.7855760143543464, 'f1': 0.7724117318261001, 'support': None}, 'weighted_avg': {'precision': 0.8786006832378638, 'recall': 0.8712338593974175, 'f1': 0.8737319950723227, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.9264214046822743, 'contradicts': 0.5704225352112676, 'parts_of_same': 0.7980535279805353}, 'recall': {'supports': 0.9111842105263158, 'contradicts': 0.6835443037974683, 'parts_of_same': 0.7754137115839244}, 'f1': {'supports': 0.9187396351575456, 'contradicts': 0.6218809980806143, 'parts_of_same': 0.7865707434052757}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8712338593974175, 'recall': 0.8712338593974175, 'f1': 0.8712338593974175, 'support': None}, 'macro_avg': {'precision': 0.7649658226246924, 'recall': 0.7900474086359028, 'f1': 0.7757304588811452, 'support': None}, 'weighted_avg': {'precision': 0.8766827590906444, 'recall': 0.8712338593974175, 'f1': 0.8734516372384484, 'support': None}}
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9394093686354379, 'contradicts': 0.46875, 'parts_of_same': 0.7659090909090909}, 'recall': {'supports': 0.8670112781954887, 'contradicts': 0.759493670886076, 'parts_of_same': 0.7966903073286052}, 'f1': {'supports': 0.9017595307917888, 'contradicts': 0.5797101449275363, 'parts_of_same': 0.7809965237543453}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8472022955523673, 'recall': 0.8472022955523673, 'f1': 0.8472022955523673, 'support': None}, 'macro_avg': {'precision': 0.7246894865148429, 'recall': 0.8077317521367232, 'f1': 0.7541553998245568, 'support': None}, 'weighted_avg': {'precision': 0.8730761950899417, 'recall': 0.8472022955523673, 'f1': 0.8560606583288526, 'support': None}}
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9338345864661655, 'contradicts': 0.4904109589041096, 'parts_of_same': 0.7616822429906542}, 'recall': {'supports': 0.8754699248120301, 'contradicts': 0.7552742616033755, 'parts_of_same': 0.7706855791962175}, 'f1': {'supports': 0.9037108901285472, 'contradicts': 0.5946843853820598, 'parts_of_same': 0.7661574618096356}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8493543758967002, 'recall': 0.8493543758967002, 'f1': 0.8493543758967003, 'support': None}, 'macro_avg': {'precision': 0.7286425961203098, 'recall': 0.8004765885372077, 'f1': 0.754850912440081, 'support': None}, 'weighted_avg': {'precision': 0.8700211571181209, 'recall': 0.8493543758967002, 'f1': 0.8565715853208655, 'support': None}}
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9526011560693641, 'contradicts': 0.44680851063829785, 'parts_of_same': 0.5395894428152492}, 'recall': {'supports': 0.7744360902255639, 'contradicts': 0.7088607594936709, 'parts_of_same': 0.8699763593380615}, 'f1': {'supports': 0.8543286677034733, 'contradicts': 0.5481239804241436, 'parts_of_same': 0.6660633484162897}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.7833572453371592, 'recall': 0.7833572453371592, 'f1': 0.7833572453371592, 'support': None}, 'macro_avg': {'precision': 0.6463330365076371, 'recall': 0.7844244030190987, 'f1': 0.6895053321813022, 'support': None}, 'weighted_avg': {'precision': 0.8469423283528456, 'recall': 0.7833572453371592, 'f1': 0.7997351451268306, 'support': None}}
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9510070767555797, 'contradicts': 0.5045871559633027, 'parts_of_same': 0.6041666666666666}, 'recall': {'supports': 0.8209586466165414, 'contradicts': 0.6962025316455697, 'parts_of_same': 0.8912529550827423}, 'f1': {'supports': 0.8812105926860025, 'contradicts': 0.5851063829787234, 'parts_of_same': 0.7201528175740209}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8210186513629842, 'recall': 0.8210186513629842, 'f1': 0.8210186513629842, 'support': None}, 'macro_avg': {'precision': 0.6865869664618497, 'recall': 0.8028047111149511, 'f1': 0.7288232644129157, 'support': None}, 'weighted_avg': {'precision': 0.8604349767931049, 'recall': 0.8210186513629842, 'f1': 0.8316036570428916, 'support': None}}
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9422343324250682, 'contradicts': 0.35856573705179284, 'parts_of_same': 0.7228381374722838}, 'recall': {'supports': 0.8125, 'contradicts': 0.759493670886076, 'parts_of_same': 0.7706855791962175}, 'f1': {'supports': 0.8725712843805199, 'contradicts': 0.48714479025710417, 'parts_of_same': 0.7459954233409611}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8016499282639885, 'recall': 0.8016499282639885, 'f1': 0.8016499282639885, 'support': None}, 'macro_avg': {'precision': 0.6745460689830481, 'recall': 0.7808930833607645, 'f1': 0.7019038326595283, 'support': None}, 'weighted_avg': {'precision': 0.859331158978693, 'recall': 0.8016499282639885, 'f1': 0.820602967190067, 'support': None}}
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9329329329329329, 'contradicts': 0.5785123966942148, 'parts_of_same': 0.6459854014598541}, 'recall': {'supports': 0.8759398496240601, 'contradicts': 0.5907172995780591, 'parts_of_same': 0.8368794326241135}, 'f1': {'supports': 0.9035385361124576, 'contradicts': 0.5845511482254697, 'parts_of_same': 0.7291452111225543}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8457675753228121, 'recall': 0.8457675753228121, 'f1': 0.8457675753228121, 'support': None}, 'macro_avg': {'precision': 0.7191435770290006, 'recall': 0.7678455272754109, 'f1': 0.739078298486827, 'support': None}, 'weighted_avg': {'precision': 0.859268487846244, 'recall': 0.8457675753228121, 'f1': 0.8499630743477713, 'support': None}}
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.926491646778043, 'contradicts': 0.5591397849462365, 'parts_of_same': 0.7874396135265701}, 'recall': {'supports': 0.912124060150376, 'contradicts': 0.6582278481012658, 'parts_of_same': 0.7706855791962175}, 'f1': {'supports': 0.9192517167890126, 'contradicts': 0.6046511627906976, 'parts_of_same': 0.7789725209080048}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8690817790530847, 'recall': 0.8690817790530847, 'f1': 0.8690817790530847, 'support': None}, 'macro_avg': {'precision': 0.7576903484169498, 'recall': 0.7803458291492863, 'f1': 0.7676251334959051, 'support': None}, 'weighted_avg': {'precision': 0.8741668973808009, 'recall': 0.8690817790530847, 'f1': 0.87122501981797, 'support': None}}
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9293320425943853, 'contradicts': 0.5498281786941581, 'parts_of_same': 0.7633410672853829}, 'recall': {'supports': 0.9022556390977443, 'contradicts': 0.6751054852320675, 'parts_of_same': 0.7777777777777778}, 'f1': {'supports': 0.9155937052932761, 'contradicts': 0.6060606060606061, 'parts_of_same': 0.7704918032786885}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8640602582496413, 'recall': 0.8640602582496413, 'f1': 0.8640602582496413, 'support': None}, 'macro_avg': {'precision': 0.7475004295246421, 'recall': 0.7850463007025299, 'f1': 0.7640487048775236, 'support': None}, 'weighted_avg': {'precision': 0.8718870647249226, 'recall': 0.8640602582496413, 'f1': 0.8672660693283143, 'support': None}}
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9313868613138686, 'contradicts': 0.5469798657718121, 'parts_of_same': 0.7609195402298851}, 'recall': {'supports': 0.8994360902255639, 'contradicts': 0.6877637130801688, 'parts_of_same': 0.7825059101654847}, 'f1': {'supports': 0.9151326798948123, 'contradicts': 0.6093457943925235, 'parts_of_same': 0.7715617715617716}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8637015781922525, 'recall': 0.8637015781922525, 'f1': 0.8637015781922525, 'support': None}, 'macro_avg': {'precision': 0.7464287557718553, 'recall': 0.7899019044904058, 'f1': 0.7653467486163691, 'support': None}, 'weighted_avg': {'precision': 0.8728459234508871, 'recall': 0.8637015781922525, 'f1': 0.8673557838801358, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.9327157484154072, 'contradicts': 0.5451505016722408, 'parts_of_same': 0.7625570776255708}, 'recall': {'supports': 0.8989661654135338, 'contradicts': 0.6877637130801688, 'parts_of_same': 0.789598108747045}, 'f1': {'supports': 0.9155300311079205, 'contradicts': 0.6082089552238805, 'parts_of_same': 0.7758420441347271}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8644189383070301, 'recall': 0.8644189383070301, 'f1': 0.86441893830703, 'support': None}, 'macro_avg': {'precision': 0.7468077759044064, 'recall': 0.7921093290802492, 'f1': 0.7665270101555093, 'support': None}, 'weighted_avg': {'precision': 0.873953165480604, 'recall': 0.8644189383070301, 'f1': 0.8682118411960918, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.9330073349633252, 'contradicts': 0.5394736842105263, 'parts_of_same': 0.7608200455580866}, 'recall': {'supports': 0.8966165413533834, 'contradicts': 0.6919831223628692, 'parts_of_same': 0.789598108747045}, 'f1': {'supports': 0.914450035945363, 'contradicts': 0.6062846580406654, 'parts_of_same': 0.7749419953596289}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8629842180774749, 'recall': 0.8629842180774749, 'f1': 0.8629842180774749, 'support': None}, 'macro_avg': {'precision': 0.7444336882439794, 'recall': 0.7927325908210991, 'f1': 0.765225563115219, 'support': None}, 'weighted_avg': {'precision': 0.8734296094802444, 'recall': 0.8629842180774749, 'f1': 0.8670873760704783, 'support': None}}
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2731e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.9338559529642332, 'contradicts': 0.5359477124183006, 'parts_of_same': 0.7596371882086168}, 'recall': {'supports': 0.8956766917293233, 'contradicts': 0.6919831223628692, 'parts_of_same': 0.7919621749408984}, 'f1': {'supports': 0.9143679539457903, 'contradicts': 0.6040515653775322, 'parts_of_same': 0.7754629629629629}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8626255380200861, 'recall': 0.8626255380200861, 'f1': 0.8626255380200861, 'support': None}, 'macro_avg': {'precision': 0.7431469511970502, 'recall': 0.7932073296776969, 'f1': 0.7646274940954285, 'support': None}, 'weighted_avg': {'precision': 0.8735981371460797, 'recall': 0.8626255380200861, 'f1': 0.866913938423404, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.9343137254901961, 'contradicts': 0.5374592833876222, 'parts_of_same': 0.7596371882086168}, 'recall': {'supports': 0.8956766917293233, 'contradicts': 0.6962025316455697, 'parts_of_same': 0.7919621749408984}, 'f1': {'supports': 0.9145873320537428, 'contradicts': 0.6066176470588237, 'parts_of_same': 0.7754629629629629}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8629842180774749, 'recall': 0.8629842180774749, 'f1': 0.8629842180774749, 'support': None}, 'macro_avg': {'precision': 0.7438033990288117, 'recall': 0.7946137994385971, 'f1': 0.7655559806918432, 'support': None}, 'weighted_avg': {'precision': 0.8740760360897591, 'recall': 0.8629842180774749, 'f1': 0.8672995187577615, 'support': None}}
Loss: tensor(1.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.9338235294117647, 'contradicts': 0.5357142857142857, 'parts_of_same': 0.7613636363636364}, 'recall': {'supports': 0.8952067669172933, 'contradicts': 0.6962025316455697, 'parts_of_same': 0.7919621749408984}, 'f1': {'supports': 0.9141074856046065, 'contradicts': 0.6055045871559633, 'parts_of_same': 0.776361529548088}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8626255380200861, 'recall': 0.8626255380200861, 'f1': 0.8626255380200861, 'support': None}, 'macro_avg': {'precision': 0.743633817163229, 'recall': 0.7944571578345871, 'f1': 0.765324534102886, 'support': None}, 'weighted_avg': {'precision': 0.8738154858265205, 'recall': 0.8626255380200861, 'f1': 0.8669749797422552, 'support': None}}
Loss: tensor(1.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.9337910740559098, 'contradicts': 0.532258064516129, 'parts_of_same': 0.7630979498861048}, 'recall': {'supports': 0.8947368421052632, 'contradicts': 0.6962025316455697, 'parts_of_same': 0.7919621749408984}, 'f1': {'supports': 0.9138468922486201, 'contradicts': 0.6032906764168189, 'parts_of_same': 0.7772621809744781}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8622668579626973, 'recall': 0.8622668579626973, 'f1': 0.8622668579626973, 'support': None}, 'macro_avg': {'precision': 0.7430490294860478, 'recall': 0.7943005162305771, 'f1': 0.764799916546639, 'support': None}, 'weighted_avg': {'precision': 0.8737600429279486, 'recall': 0.8622668579626973, 'f1': 0.8667245263873938, 'support': None}}
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.9342492639842983, 'contradicts': 0.5305466237942122, 'parts_of_same': 0.7630979498861048}, 'recall': {'supports': 0.8947368421052632, 'contradicts': 0.6962025316455697, 'parts_of_same': 0.7919621749408984}, 'f1': {'supports': 0.9140662506000959, 'contradicts': 0.6021897810218979, 'parts_of_same': 0.7772621809744781}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8622668579626973, 'recall': 0.8622668579626973, 'f1': 0.8622668579626973, 'support': None}, 'macro_avg': {'precision': 0.7426312792215385, 'recall': 0.7943005162305771, 'f1': 0.7645060708654906, 'support': None}, 'weighted_avg': {'precision': 0.8739642813485069, 'recall': 0.8622668579626973, 'f1': 0.8667983722852936, 'support': None}}
Loss: tensor(3.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.9342492639842983, 'contradicts': 0.532258064516129, 'parts_of_same': 0.7613636363636364}, 'recall': {'supports': 0.8947368421052632, 'contradicts': 0.6962025316455697, 'parts_of_same': 0.7919621749408984}, 'f1': {'supports': 0.9140662506000959, 'contradicts': 0.6032906764168189, 'parts_of_same': 0.776361529548088}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8622668579626973, 'recall': 0.8622668579626973, 'f1': 0.8622668579626973, 'support': None}, 'macro_avg': {'precision': 0.7426236549546879, 'recall': 0.7943005162305771, 'f1': 0.764572818855001, 'support': None}, 'weighted_avg': {'precision': 0.8738466331530585, 'recall': 0.8622668579626973, 'f1': 0.8667553079579022, 'support': None}}
Loss: tensor(6.4525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.9342169857633775, 'contradicts': 0.532258064516129, 'parts_of_same': 0.7596371882086168}, 'recall': {'supports': 0.894266917293233, 'contradicts': 0.6962025316455697, 'parts_of_same': 0.7919621749408984}, 'f1': {'supports': 0.9138055222088834, 'contradicts': 0.6032906764168189, 'parts_of_same': 0.7754629629629629}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8619081779053085, 'recall': 0.8619081779053085, 'f1': 0.8619081779053085, 'support': None}, 'macro_avg': {'precision': 0.7420374128293744, 'recall': 0.7941438746265671, 'f1': 0.7641863871962218, 'support': None}, 'weighted_avg': {'precision': 0.8735600565305003, 'recall': 0.8619081779053085, 'f1': 0.8664199694779855, 'support': None}}
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.9341846758349706, 'contradicts': 0.532258064516129, 'parts_of_same': 0.7579185520361991}, 'recall': {'supports': 0.893796992481203, 'contradicts': 0.6962025316455697, 'parts_of_same': 0.7919621749408984}, 'f1': {'supports': 0.9135446685878963, 'contradicts': 0.6032906764168189, 'parts_of_same': 0.7745664739884393}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8615494978479197, 'recall': 0.8615494978479197, 'f1': 0.8615494978479197, 'support': None}, 'macro_avg': {'precision': 0.7414537641290995, 'recall': 0.7939872330225571, 'f1': 0.7638006063310515, 'support': None}, 'weighted_avg': {'precision': 0.8732746409535338, 'recall': 0.8615494978479197, 'f1': 0.8660848506323312, 'support': None}}
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9346437346437346, 'contradicts': 0.5337620578778135, 'parts_of_same': 0.7579185520361991}, 'recall': {'supports': 0.893796992481203, 'contradicts': 0.70042194092827, 'parts_of_same': 0.7919621749408984}, 'f1': {'supports': 0.9137641124189286, 'contradicts': 0.6058394160583942, 'parts_of_same': 0.7745664739884393}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8619081779053085, 'recall': 0.8619081779053085, 'f1': 0.8619081779053085, 'support': None}, 'macro_avg': {'precision': 0.7421081148525824, 'recall': 0.7953937027834571, 'f1': 0.7647233341552541, 'support': None}, 'weighted_avg': {'precision': 0.8737528775287738, 'recall': 0.8619081779053085, 'f1': 0.8664690069334395, 'support': None}}
Loss: tensor(3.5176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.9346758349705304, 'contradicts': 0.535483870967742, 'parts_of_same': 0.7579185520361991}, 'recall': {'supports': 0.894266917293233, 'contradicts': 0.70042194092827, 'parts_of_same': 0.7919621749408984}, 'f1': {'supports': 0.9140249759846302, 'contradicts': 0.6069469835466179, 'parts_of_same': 0.7745664739884393}, 'support': {'supports': 2128, 'contradicts': 237, 'parts_of_same': 423}, 'micro_avg': {'precision': 0.8622668579626973, 'recall': 0.8622668579626973, 'f1': 0.8622668579626973, 'support': None}, 'macro_avg': {'precision': 0.7426927526581572, 'recall': 0.7955503443874671, 'f1': 0.7651794778398958, 'support': None}, 'weighted_avg': {'precision': 0.873923745246756, 'recall': 0.8622668579626973, 'f1': 0.8667622677521347, 'support': None}}
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 2-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.0, 'contradicts': 0.08562572646261139, 'parts_of_same': 0.2140845070422535}, 'recall': {'supports': 0.0, 'contradicts': 0.8467432950191571, 'parts_of_same': 0.13893967093235832}, 'f1': {'supports': 0.0, 'contradicts': 0.15552427867698804, 'parts_of_same': 0.16851441241685144}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.10115803814713896, 'recall': 0.10115803814713896, 'f1': 0.10115803814713896, 'support': None}, 'macro_avg': {'precision': 0.09990341116828831, 'recall': 0.32856098865050515, 'f1': 0.10801289703127982, 'support': None}, 'weighted_avg': {'precision': 0.04749745911405118, 'recall': 0.10115803814713896, 'f1': 0.04522112408947943, 'support': None}}
Loss: tensor(0.4224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9196261682242991, 'contradicts': 0.3032904148783977, 'parts_of_same': 0.6550632911392406}, 'recall': {'supports': 0.6932832315641146, 'contradicts': 0.8153846153846154, 'parts_of_same': 0.7568555758683729}, 'f1': {'supports': 0.7905731119442958, 'contradicts': 0.4421272158498436, 'parts_of_same': 0.7022900763358779}, 'support': {'supports': 2129, 'contradicts': 260, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.7159400544959128, 'recall': 0.7159400544959128, 'f1': 0.7159400544959128, 'support': None}, 'macro_avg': {'precision': 0.6259932914139791, 'recall': 0.7551744742723677, 'f1': 0.6449968013766724, 'support': None}, 'weighted_avg': {'precision': 0.8157558720269349, 'recall': 0.7159400544959128, 'f1': 0.7432683594026194, 'support': None}}
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9385665529010239, 'contradicts': 0.5094850948509485, 'parts_of_same': 0.5784919653893696}, 'recall': {'supports': 0.7750117426021607, 'contradicts': 0.7203065134099617, 'parts_of_same': 0.8571428571428571}, 'f1': {'supports': 0.8489837921276048, 'contradicts': 0.5968253968253968, 'parts_of_same': 0.6907749077490776}, 'support': {'supports': 2129, 'contradicts': 261, 'parts_of_same': 546}, 'micro_avg': {'precision': 0.7854223433242506, 'recall': 0.7854223433242506, 'f1': 0.7854223433242506, 'support': None}, 'macro_avg': {'precision': 0.6755145377137808, 'recall': 0.7841537043849932, 'f1': 0.7121946989006931, 'support': None}, 'weighted_avg': {'precision': 0.8334606314662716, 'recall': 0.7854223433242506, 'f1': 0.7971461245374983, 'support': None}}
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5522, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9426229508196722, 'contradicts': 0.4891304347826087, 'parts_of_same': 0.4979633401221996}, 'recall': {'supports': 0.7025375939849624, 'contradicts': 0.6896551724137931, 'parts_of_same': 0.8939670932358318}, 'f1': {'supports': 0.8050619278406032, 'contradicts': 0.5723370429252783, 'parts_of_same': 0.6396337475474166}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.7370572207084468, 'recall': 0.7370572207084468, 'f1': 0.7370572207084467, 'support': None}, 'macro_avg': {'precision': 0.6432389085748268, 'recall': 0.7620532865448625, 'f1': 0.672344239437766, 'support': None}, 'weighted_avg': {'precision': 0.8194654733887488, 'recall': 0.7370572207084468, 'f1': 0.7535529327509326, 'support': None}}
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.9069423929098966, 'contradicts': 0.538235294117647, 'parts_of_same': 0.7168141592920354}, 'recall': {'supports': 0.8656015037593985, 'contradicts': 0.7011494252873564, 'parts_of_same': 0.7404021937842779}, 'f1': {'supports': 0.8857898533301275, 'contradicts': 0.6089850249584027, 'parts_of_same': 0.7284172661870503}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8276566757493188, 'recall': 0.8276566757493188, 'f1': 0.8276566757493188, 'support': None}, 'macro_avg': {'precision': 0.7206639487731931, 'recall': 0.7690510409436776, 'f1': 0.7410640481585268, 'support': None}, 'weighted_avg': {'precision': 0.8387432455755139, 'recall': 0.8276566757493188, 'f1': 0.8318631280670882, 'support': None}}
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.8985981308411215, 'contradicts': 0.5899280575539568, 'parts_of_same': 0.7760617760617761}, 'recall': {'supports': 0.9032409581963363, 'contradicts': 0.6307692307692307, 'parts_of_same': 0.7349177330895795}, 'f1': {'supports': 0.9009135628952917, 'contradicts': 0.6096654275092938, 'parts_of_same': 0.7549295774647887}, 'support': {'supports': 2129, 'contradicts': 260, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8477520435967303, 'recall': 0.8477520435967303, 'f1': 0.8477520435967303, 'support': None}, 'macro_avg': {'precision': 0.7548626548189515, 'recall': 0.7563093073517155, 'f1': 0.7551695226231248, 'support': None}, 'weighted_avg': {'precision': 0.8484340964000572, 'recall': 0.8477520435967303, 'f1': 0.8479238642471838, 'support': None}}
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9017814155031295, 'contradicts': 0.5577557755775577, 'parts_of_same': 0.7284172661870504}, 'recall': {'supports': 0.8801691729323309, 'contradicts': 0.6475095785440613, 'parts_of_same': 0.7404021937842779}, 'f1': {'supports': 0.8908442330558858, 'contradicts': 0.599290780141844, 'parts_of_same': 0.7343608340888487}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8334468664850136, 'recall': 0.8334468664850136, 'f1': 0.8334468664850136, 'support': None}, 'macro_avg': {'precision': 0.7293181524225792, 'recall': 0.7560269817535566, 'f1': 0.7414986157621928, 'support': None}, 'weighted_avg': {'precision': 0.8388996438081467, 'recall': 0.8334468664850136, 'f1': 0.8357720700975976, 'support': None}}
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9016620498614959, 'contradicts': 0.646551724137931, 'parts_of_same': 0.7806691449814126}, 'recall': {'supports': 0.9173320807891029, 'contradicts': 0.5747126436781609, 'parts_of_same': 0.7692307692307693}, 'f1': {'supports': 0.909429569266589, 'contradicts': 0.6085192697768763, 'parts_of_same': 0.7749077490774907}, 'support': {'supports': 2129, 'contradicts': 261, 'parts_of_same': 546}, 'micro_avg': {'precision': 0.8593324250681199, 'recall': 0.8593324250681199, 'f1': 0.8593324250681199, 'support': None}, 'macro_avg': {'precision': 0.7762943063269465, 'recall': 0.7537584978993443, 'f1': 0.764285529373652, 'support': None}, 'weighted_avg': {'precision': 0.8564829214288066, 'recall': 0.8593324250681199, 'f1': 0.8576630495152052, 'support': None}}
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.9045837231057062, 'contradicts': 0.6326530612244898, 'parts_of_same': 0.7685352622061483}, 'recall': {'supports': 0.9088345864661654, 'contradicts': 0.5938697318007663, 'parts_of_same': 0.7769652650822669}, 'f1': {'supports': 0.9067041725269573, 'contradicts': 0.6126482213438734, 'parts_of_same': 0.7727272727272727}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8562670299727521, 'recall': 0.8562670299727521, 'f1': 0.8562670299727521, 'support': None}, 'macro_avg': {'precision': 0.7685906821787815, 'recall': 0.7598898611163994, 'f1': 0.764026555532701, 'support': None}, 'weighted_avg': {'precision': 0.8550631471986709, 'recall': 0.8562670299727521, 'f1': 0.8556026849761357, 'support': None}}
Loss: tensor(4.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9044496487119438, 'contradicts': 0.6285714285714286, 'parts_of_same': 0.7643884892086331}, 'recall': {'supports': 0.9069985908877407, 'contradicts': 0.5923076923076923, 'parts_of_same': 0.7769652650822669}, 'f1': {'supports': 0.9057223264540337, 'contradicts': 0.6099009900990098, 'parts_of_same': 0.7706255666364461}, 'support': {'supports': 2129, 'contradicts': 260, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8549046321525886, 'recall': 0.8549046321525886, 'f1': 0.8549046321525886, 'support': None}, 'macro_avg': {'precision': 0.7658031888306684, 'recall': 0.7587571827592333, 'f1': 0.7620829610631632, 'support': None}, 'weighted_avg': {'precision': 0.853924515372419, 'recall': 0.8549046321525886, 'f1': 0.8543560202304211, 'support': None}}
Loss: tensor(9.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9038912330051571, 'contradicts': 0.625, 'parts_of_same': 0.7639639639639639}, 'recall': {'supports': 0.9060150375939849, 'contradicts': 0.5938697318007663, 'parts_of_same': 0.7751371115173674}, 'f1': {'supports': 0.9049518892278807, 'contradicts': 0.6090373280943026, 'parts_of_same': 0.7695099818511796}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.853882833787466, 'recall': 0.853882833787466, 'f1': 0.8538828337874659, 'support': None}, 'macro_avg': {'precision': 0.7642850656563738, 'recall': 0.7583406269707061, 'f1': 0.7611663997244543, 'support': None}, 'weighted_avg': {'precision': 0.853029234374408, 'recall': 0.853882833787466, 'f1': 0.8534122353481397, 'support': None}}
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9040262172284644, 'contradicts': 0.6275303643724697, 'parts_of_same': 0.7649186256781193}, 'recall': {'supports': 0.9069985908877407, 'contradicts': 0.5938697318007663, 'parts_of_same': 0.7747252747252747}, 'f1': {'supports': 0.9055099648300117, 'contradicts': 0.6102362204724409, 'parts_of_same': 0.7697907188353048}, 'support': {'supports': 2129, 'contradicts': 261, 'parts_of_same': 546}, 'micro_avg': {'precision': 0.8545640326975477, 'recall': 0.8545640326975477, 'f1': 0.8545640326975478, 'support': None}, 'macro_avg': {'precision': 0.7654917357596845, 'recall': 0.7585311991379272, 'f1': 0.7618456347125857, 'support': None}, 'weighted_avg': {'precision': 0.8535772517714131, 'recall': 0.8545640326975477, 'f1': 0.8540218328169205, 'support': None}}
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9045390734674777, 'contradicts': 0.6290322580645161, 'parts_of_same': 0.7695099818511797}, 'recall': {'supports': 0.9083646616541353, 'contradicts': 0.5977011494252874, 'parts_of_same': 0.7751371115173674}, 'f1': {'supports': 0.9064478311840563, 'contradicts': 0.6129666011787819, 'parts_of_same': 0.7723132969034608}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8559264305177112, 'recall': 0.8559264305177112, 'f1': 0.8559264305177112, 'support': None}, 'macro_avg': {'precision': 0.7676937711277244, 'recall': 0.76040097419893, 'f1': 0.7639092430887664, 'support': None}, 'weighted_avg': {'precision': 0.8548905067323659, 'recall': 0.8559264305177112, 'f1': 0.8553680657607379, 'support': None}}
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9046283309957924, 'contradicts': 0.631578947368421, 'parts_of_same': 0.7709090909090909}, 'recall': {'supports': 0.9093045112781954, 'contradicts': 0.5977011494252874, 'parts_of_same': 0.7751371115173674}, 'f1': {'supports': 0.9069603937192406, 'contradicts': 0.6141732283464568, 'parts_of_same': 0.773017319963537}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8566076294277929, 'recall': 0.8566076294277929, 'f1': 0.8566076294277929, 'support': None}, 'macro_avg': {'precision': 0.7690387897577682, 'recall': 0.7607142574069501, 'f1': 0.7647169806764115, 'support': None}, 'weighted_avg': {'precision': 0.8554422569310206, 'recall': 0.8566076294277929, 'f1': 0.855977998791902, 'support': None}}
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9046283309957924, 'contradicts': 0.631578947368421, 'parts_of_same': 0.7709090909090909}, 'recall': {'supports': 0.9093045112781954, 'contradicts': 0.5977011494252874, 'parts_of_same': 0.7751371115173674}, 'f1': {'supports': 0.9069603937192406, 'contradicts': 0.6141732283464568, 'parts_of_same': 0.773017319963537}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8566076294277929, 'recall': 0.8566076294277929, 'f1': 0.8566076294277929, 'support': None}, 'macro_avg': {'precision': 0.7690387897577682, 'recall': 0.7607142574069501, 'f1': 0.7647169806764115, 'support': None}, 'weighted_avg': {'precision': 0.8554422569310206, 'recall': 0.8566076294277929, 'f1': 0.855977998791902, 'support': None}}
Loss: tensor(1.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9046283309957924, 'contradicts': 0.6300813008130082, 'parts_of_same': 0.7695099818511797}, 'recall': {'supports': 0.9088774072334429, 'contradicts': 0.5961538461538461, 'parts_of_same': 0.7751371115173674}, 'f1': {'supports': 0.9067478912839738, 'contradicts': 0.6126482213438735, 'parts_of_same': 0.7723132969034608}, 'support': {'supports': 2129, 'contradicts': 260, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8562670299727521, 'recall': 0.8562670299727521, 'f1': 0.8562670299727521, 'support': None}, 'macro_avg': {'precision': 0.7680732045533268, 'recall': 0.7600561216348855, 'f1': 0.7639031365104362, 'support': None}, 'weighted_avg': {'precision': 0.8551419669530039, 'recall': 0.8562670299727521, 'f1': 0.8556574153607562, 'support': None}}
Loss: tensor(9.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9045390734674777, 'contradicts': 0.6290322580645161, 'parts_of_same': 0.7695099818511797}, 'recall': {'supports': 0.9083646616541353, 'contradicts': 0.5977011494252874, 'parts_of_same': 0.7751371115173674}, 'f1': {'supports': 0.9064478311840563, 'contradicts': 0.6129666011787819, 'parts_of_same': 0.7723132969034608}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8559264305177112, 'recall': 0.8559264305177112, 'f1': 0.8559264305177112, 'support': None}, 'macro_avg': {'precision': 0.7676937711277244, 'recall': 0.76040097419893, 'f1': 0.7639092430887664, 'support': None}, 'weighted_avg': {'precision': 0.8548905067323659, 'recall': 0.8559264305177112, 'f1': 0.8553680657607379, 'support': None}}
Loss: tensor(2.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9046283309957924, 'contradicts': 0.6275303643724697, 'parts_of_same': 0.7709090909090909}, 'recall': {'supports': 0.9088774072334429, 'contradicts': 0.5961538461538461, 'parts_of_same': 0.7751371115173674}, 'f1': {'supports': 0.9067478912839738, 'contradicts': 0.6114398422090729, 'parts_of_same': 0.773017319963537}, 'support': {'supports': 2129, 'contradicts': 260, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8562670299727521, 'recall': 0.8562670299727521, 'f1': 0.8562670299727521, 'support': None}, 'macro_avg': {'precision': 0.767689262092451, 'recall': 0.7600561216348855, 'f1': 0.7637350178188612, 'support': None}, 'weighted_avg': {'precision': 0.8551767316601352, 'recall': 0.8562670299727521, 'f1': 0.8556815713685267, 'support': None}}
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.9042950513538749, 'contradicts': 0.6300813008130082, 'parts_of_same': 0.7737226277372263}, 'recall': {'supports': 0.9102443609022557, 'contradicts': 0.5938697318007663, 'parts_of_same': 0.7751371115173674}, 'f1': {'supports': 0.9072599531615926, 'contradicts': 0.6114398422090731, 'parts_of_same': 0.7744292237442921}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8569482288828338, 'recall': 0.8569482288828338, 'f1': 0.8569482288828338, 'support': None}, 'macro_avg': {'precision': 0.7693663266347032, 'recall': 0.7597504014067965, 'f1': 0.7643763397049859, 'support': None}, 'weighted_avg': {'precision': 0.855591745969177, 'recall': 0.8569482288828338, 'f1': 0.8562151786555057, 'support': None}}
Loss: tensor(7.5518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.9042950513538749, 'contradicts': 0.6300813008130082, 'parts_of_same': 0.7718978102189781}, 'recall': {'supports': 0.909816815406294, 'contradicts': 0.5938697318007663, 'parts_of_same': 0.7747252747252747}, 'f1': {'supports': 0.9070475298524936, 'contradicts': 0.6114398422090731, 'parts_of_same': 0.773308957952468}, 'support': {'supports': 2129, 'contradicts': 261, 'parts_of_same': 546}, 'micro_avg': {'precision': 0.8566076294277929, 'recall': 0.8566076294277929, 'f1': 0.8566076294277929, 'support': None}, 'macro_avg': {'precision': 0.7687580541286204, 'recall': 0.7594706073107783, 'f1': 0.7639321100046783, 'support': None}, 'weighted_avg': {'precision': 0.8552968624741679, 'recall': 0.8566076294277929, 'f1': 0.8558980520826207, 'support': None}}
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9609e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.9039179104477612, 'contradicts': 0.6337448559670782, 'parts_of_same': 0.7723132969034608}, 'recall': {'supports': 0.9107142857142857, 'contradicts': 0.5900383141762452, 'parts_of_same': 0.7751371115173674}, 'f1': {'supports': 0.9073033707865168, 'contradicts': 0.611111111111111, 'parts_of_same': 0.7737226277372263}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8569482288828338, 'recall': 0.8569482288828338, 'f1': 0.8569482288828338, 'support': None}, 'macro_avg': {'precision': 0.7699920211061001, 'recall': 0.7586299038026327, 'f1': 0.7640457032116181, 'support': None}, 'weighted_avg': {'precision': 0.8553815034899306, 'recall': 0.8569482288828338, 'f1': 0.8560857801110253, 'support': None}}
Loss: tensor(6.4458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.9038730751283248, 'contradicts': 0.6311475409836066, 'parts_of_same': 0.7723132969034608}, 'recall': {'supports': 0.9102443609022557, 'contradicts': 0.5900383141762452, 'parts_of_same': 0.7751371115173674}, 'f1': {'supports': 0.9070475298524936, 'contradicts': 0.6099009900990099, 'parts_of_same': 0.7737226277372263}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8566076294277929, 'recall': 0.8566076294277929, 'f1': 0.8566076294277929, 'support': None}, 'macro_avg': {'precision': 0.7691113043384642, 'recall': 0.7584732621986228, 'f1': 0.7635570492295766, 'support': None}, 'weighted_avg': {'precision': 0.8551181149441383, 'recall': 0.8566076294277929, 'f1': 0.8557927722459846, 'support': None}}
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.9034514925373134, 'contradicts': 0.6322314049586777, 'parts_of_same': 0.7727272727272727}, 'recall': {'supports': 0.9102443609022557, 'contradicts': 0.5862068965517241, 'parts_of_same': 0.7769652650822669}, 'f1': {'supports': 0.9068352059925094, 'contradicts': 0.6083499005964214, 'parts_of_same': 0.7748404740200546}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8566076294277929, 'recall': 0.8566076294277929, 'f1': 0.8566076294277929, 'support': None}, 'macro_avg': {'precision': 0.7694700567410879, 'recall': 0.7578055075120823, 'f1': 0.7633418602029951, 'support': None}, 'weighted_avg': {'precision': 0.8549860323553937, 'recall': 0.8566076294277929, 'f1': 0.8557092580710818, 'support': None}}
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.9030754892823858, 'contradicts': 0.6317991631799164, 'parts_of_same': 0.7713248638838476}, 'recall': {'supports': 0.9107142857142857, 'contradicts': 0.578544061302682, 'parts_of_same': 0.7769652650822669}, 'f1': {'supports': 0.9068788020589611, 'contradicts': 0.604, 'parts_of_same': 0.7741347905282333}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8562670299727521, 'recall': 0.8562670299727521, 'f1': 0.8562670299727521, 'support': None}, 'macro_avg': {'precision': 0.7687331721153833, 'recall': 0.7554078706997448, 'f1': 0.7616711975290648, 'support': None}, 'weighted_avg': {'precision': 0.8544138022232084, 'recall': 0.8562670299727521, 'f1': 0.8552226911445547, 'support': None}}
Loss: tensor(3.6919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.9031657355679702, 'contradicts': 0.6371308016877637, 'parts_of_same': 0.7713248638838476}, 'recall': {'supports': 0.9116541353383458, 'contradicts': 0.578544061302682, 'parts_of_same': 0.7769652650822669}, 'f1': {'supports': 0.9073900841908326, 'contradicts': 0.606425702811245, 'parts_of_same': 0.7741347905282333}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8569482288828338, 'recall': 0.8569482288828338, 'f1': 0.8569482288828338, 'support': None}, 'macro_avg': {'precision': 0.7705404670465271, 'recall': 0.755721153907765, 'f1': 0.7626501925101036, 'support': None}, 'weighted_avg': {'precision': 0.8549531761149903, 'recall': 0.8569482288828338, 'f1': 0.8558089025922241, 'support': None}}
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.9027454630060493, 'contradicts': 0.6371308016877637, 'parts_of_same': 0.7709090909090909}, 'recall': {'supports': 0.9116541353383458, 'contradicts': 0.578544061302682, 'parts_of_same': 0.7751371115173674}, 'f1': {'supports': 0.9071779284545242, 'contradicts': 0.606425702811245, 'parts_of_same': 0.773017319963537}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8566076294277929, 'recall': 0.8566076294277929, 'f1': 0.8566076294277929, 'support': None}, 'macro_avg': {'precision': 0.770261785200968, 'recall': 0.7551117693861317, 'f1': 0.762206983743102, 'support': None}, 'weighted_avg': {'precision': 0.8545711026037643, 'recall': 0.8566076294277929, 'f1': 0.8554469394431258, 'support': None}}
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.9031657355679702, 'contradicts': 0.6371308016877637, 'parts_of_same': 0.7713248638838476}, 'recall': {'supports': 0.9116541353383458, 'contradicts': 0.578544061302682, 'parts_of_same': 0.7769652650822669}, 'f1': {'supports': 0.9073900841908326, 'contradicts': 0.606425702811245, 'parts_of_same': 0.7741347905282333}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8569482288828338, 'recall': 0.8569482288828338, 'f1': 0.8569482288828338, 'support': None}, 'macro_avg': {'precision': 0.7705404670465271, 'recall': 0.755721153907765, 'f1': 0.7626501925101036, 'support': None}, 'weighted_avg': {'precision': 0.8549531761149903, 'recall': 0.8569482288828338, 'f1': 0.8558089025922241, 'support': None}}
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.903210795718939, 'contradicts': 0.6371308016877637, 'parts_of_same': 0.7727272727272727}, 'recall': {'supports': 0.912124060150376, 'contradicts': 0.578544061302682, 'parts_of_same': 0.7769652650822669}, 'f1': {'supports': 0.9076455459434183, 'contradicts': 0.606425702811245, 'parts_of_same': 0.7748404740200546}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8572888283378747, 'recall': 0.8572888283378747, 'f1': 0.8572888283378748, 'support': None}, 'macro_avg': {'precision': 0.7710229567113251, 'recall': 0.7558777955117749, 'f1': 0.7629705742582393, 'support': None}, 'weighted_avg': {'precision': 0.8552471153651998, 'recall': 0.8572888283378747, 'f1': 0.8561255345675405, 'support': None}}
Loss: tensor(3.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8633e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9028810408921933, 'contradicts': 0.6425531914893617, 'parts_of_same': 0.7723132969034608}, 'recall': {'supports': 0.9130639097744361, 'contradicts': 0.578544061302682, 'parts_of_same': 0.7751371115173674}, 'f1': {'supports': 0.9079439252336449, 'contradicts': 0.6088709677419356, 'parts_of_same': 0.7737226277372263}, 'support': {'supports': 2128, 'contradicts': 261, 'parts_of_same': 547}, 'micro_avg': {'precision': 0.8576294277929155, 'recall': 0.8576294277929155, 'f1': 0.8576294277929155, 'support': None}, 'macro_avg': {'precision': 0.772582509761672, 'recall': 0.7555816941981618, 'f1': 0.7635125069042689, 'support': None}, 'weighted_avg': {'precision': 0.8554130147832099, 'recall': 0.8576294277929155, 'f1': 0.8563509103712889, 'support': None}}
Loss: tensor(1.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4924e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7789e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6840e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.9029712163416899, 'contradicts': 0.6452991452991453, 'parts_of_same': 0.7718978102189781}, 'recall': {'supports': 0.9135744480976985, 'contradicts': 0.578544061302682, 'parts_of_same': 0.7747252747252747}, 'f1': {'supports': 0.9082418865281345, 'contradicts': 0.6101010101010101, 'parts_of_same': 0.773308957952468}, 'support': {'supports': 2129, 'contradicts': 261, 'parts_of_same': 546}, 'micro_avg': {'precision': 0.8579700272479565, 'recall': 0.8579700272479565, 'f1': 0.8579700272479566, 'support': None}, 'macro_avg': {'precision': 0.7733893906199377, 'recall': 0.7556145947085517, 'f1': 0.7638839515272043, 'support': None}, 'weighted_avg': {'precision': 0.8556897142009866, 'recall': 0.8579700272479565, 'f1': 0.8566451059594038, 'support': None}}
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8920e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1304e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8650e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5029e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1591e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6396e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7789e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9920e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0548e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6161e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4350e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 3-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.7294011706438541, 'contradicts': 0.19852164730728616, 'parts_of_same': 0.24}, 'recall': {'supports': 0.6769745089845383, 'contradicts': 0.5987261146496815, 'parts_of_same': 0.058919803600654665}, 'f1': {'supports': 0.7022106631989598, 'contradicts': 0.29817605075337034, 'parts_of_same': 0.09461235216819973}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.5557564798071127, 'recall': 0.5557564798071127, 'f1': 0.5557564798071127, 'support': None}, 'macro_avg': {'precision': 0.38930760598371345, 'recall': 0.44487347574495817, 'f1': 0.36499968870684324, 'support': None}, 'weighted_avg': {'precision': 0.589039420917791, 'recall': 0.5557564798071127, 'f1': 0.552087264661374, 'support': None}}
Loss: tensor(1.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4508, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9485981308411215, 'contradicts': 0.5953307392996109, 'parts_of_same': 0.3761996161228407}, 'recall': {'supports': 0.5938152946092771, 'contradicts': 0.4872611464968153, 'parts_of_same': 0.9623567921440261}, 'f1': {'supports': 0.7304034952454381, 'contradicts': 0.5359019264448336, 'parts_of_same': 0.5409383624655014}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.6515973477998794, 'recall': 0.6515973477998794, 'f1': 0.6515973477998794, 'support': None}, 'macro_avg': {'precision': 0.6400428287545245, 'recall': 0.6811444110833729, 'f1': 0.6024145947185909, 'support': None}, 'weighted_avg': {'precision': 0.8097610442115544, 'recall': 0.6515973477998794, 'f1': 0.6771073262484727, 'support': None}}
Loss: tensor(2.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.8995215311004785, 'contradicts': 0.5606060606060606, 'parts_of_same': 0.6589259796806967}, 'recall': {'supports': 0.8641872127037192, 'contradicts': 0.589171974522293, 'parts_of_same': 0.7430441898527005}, 'f1': {'supports': 0.8815004262574596, 'contradicts': 0.5745341614906833, 'parts_of_same': 0.6984615384615385}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8158529234478602, 'recall': 0.8158529234478602, 'f1': 0.8158529234478603, 'support': None}, 'macro_avg': {'precision': 0.7063511904624119, 'recall': 0.7321344590262376, 'f1': 0.7181653754032271, 'support': None}, 'weighted_avg': {'precision': 0.823143188830215, 'recall': 0.8158529234478602, 'f1': 0.8187444987167497, 'support': None}}
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.8869778869778869, 'contradicts': 0.6851063829787234, 'parts_of_same': 0.6942277691107644}, 'recall': {'supports': 0.90513999164229, 'contradicts': 0.5127388535031847, 'parts_of_same': 0.7283142389525368}, 'f1': {'supports': 0.8959669079627715, 'contradicts': 0.5865209471766849, 'parts_of_same': 0.7108626198083068}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8354430379746836, 'recall': 0.8354430379746836, 'f1': 0.8354430379746836, 'support': None}, 'macro_avg': {'precision': 0.7554373463557916, 'recall': 0.7153976946993371, 'f1': 0.7311168249825878, 'support': None}, 'weighted_avg': {'precision': 0.8323793413864012, 'recall': 0.8354430379746836, 'f1': 0.8325959761516778, 'support': None}}
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.8717538953256093, 'contradicts': 0.6761904761904762, 'parts_of_same': 0.6942148760330579}, 'recall': {'supports': 0.9118261596322608, 'contradicts': 0.45222929936305734, 'parts_of_same': 0.6873977086743044}, 'f1': {'supports': 0.8913398692810458, 'contradicts': 0.5419847328244276, 'parts_of_same': 0.6907894736842105}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8270042194092827, 'recall': 0.8270042194092827, 'f1': 0.8270042194092827, 'support': None}, 'macro_avg': {'precision': 0.7473864158497144, 'recall': 0.6838177225565408, 'f1': 0.708038025263228, 'support': None}, 'weighted_avg': {'precision': 0.8205533967131377, 'recall': 0.8270042194092827, 'f1': 0.8213477642307009, 'support': None}}
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(10.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.8876033057851239, 'contradicts': 0.5251396648044693, 'parts_of_same': 0.7759259259259259}, 'recall': {'supports': 0.897618052653573, 'contradicts': 0.5987261146496815, 'parts_of_same': 0.6857610474631751}, 'f1': {'supports': 0.8925825888219405, 'contradicts': 0.5595238095238095, 'parts_of_same': 0.7280625543006082}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8303194695599759, 'recall': 0.8303194695599759, 'f1': 0.8303194695599759, 'support': None}, 'macro_avg': {'precision': 0.7295562988385065, 'recall': 0.7273684049221432, 'f1': 0.7267229842154528, 'support': None}, 'weighted_avg': {'precision': 0.8327363792143295, 'recall': 0.8303194695599759, 'f1': 0.8307675804457659, 'support': None}}
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.934409687184662, 'contradicts': 0.529891304347826, 'parts_of_same': 0.5557851239669421}, 'recall': {'supports': 0.7739239448391141, 'contradicts': 0.6210191082802548, 'parts_of_same': 0.8805237315875614}, 'f1': {'supports': 0.8466285714285714, 'contradicts': 0.5718475073313783, 'parts_of_same': 0.681443951868271}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.7790837854128994, 'recall': 0.7790837854128994, 'f1': 0.7790837854128994, 'support': None}, 'macro_avg': {'precision': 0.67336203849981, 'recall': 0.7584889282356434, 'f1': 0.6999733435427403, 'support': None}, 'weighted_avg': {'precision': 0.826405353147051, 'recall': 0.7790837854128994, 'f1': 0.7902063120319884, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8144, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9126478616924477, 'contradicts': 0.473568281938326, 'parts_of_same': 0.7072072072072072}, 'recall': {'supports': 0.8382783117425825, 'contradicts': 0.6847133757961783, 'parts_of_same': 0.7708674304418985}, 'f1': {'supports': 0.8738836854715748, 'contradicts': 0.5598958333333334, 'parts_of_same': 0.7376664056382145}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.811332127787824, 'recall': 0.811332127787824, 'f1': 0.811332127787824, 'support': None}, 'macro_avg': {'precision': 0.6978077836126603, 'recall': 0.7646197059935531, 'f1': 0.7238153081477076, 'support': None}, 'weighted_avg': {'precision': 0.8332641281381148, 'recall': 0.811332127787824, 'f1': 0.8190853299713966, 'support': None}}
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.8831587429492345, 'contradicts': 0.5874587458745875, 'parts_of_same': 0.7954971857410882}, 'recall': {'supports': 0.9160050146259925, 'contradicts': 0.5668789808917197, 'parts_of_same': 0.6939443535188216}, 'f1': {'supports': 0.8992820512820512, 'contradicts': 0.5769854132901134, 'parts_of_same': 0.7412587412587412}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8420735382760699, 'recall': 0.8420735382760699, 'f1': 0.8420735382760699, 'support': None}, 'macro_avg': {'precision': 0.7553715581883034, 'recall': 0.7256094496788447, 'f1': 0.7391754019436353, 'support': None}, 'weighted_avg': {'precision': 0.8390324588818395, 'recall': 0.8420735382760699, 'f1': 0.8396818744424759, 'support': None}}
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.881858229875851, 'contradicts': 0.6299212598425197, 'parts_of_same': 0.7795414462081128}, 'recall': {'supports': 0.9201838696197242, 'contradicts': 0.5095541401273885, 'parts_of_same': 0.723404255319149}, 'f1': {'supports': 0.9006134969325154, 'contradicts': 0.5633802816901408, 'parts_of_same': 0.7504244482173175}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8450874020494273, 'recall': 0.8450874020494273, 'f1': 0.8450874020494273, 'support': None}, 'macro_avg': {'precision': 0.7637736453088279, 'recall': 0.7177140883554206, 'f1': 0.7381394089466579, 'support': None}, 'weighted_avg': {'precision': 0.8391747568766184, 'recall': 0.8450874020494273, 'f1': 0.8410424486048808, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.8928416485900217, 'contradicts': 0.52046783625731, 'parts_of_same': 0.6676602086438153}, 'recall': {'supports': 0.8600083577099875, 'contradicts': 0.5668789808917197, 'parts_of_same': 0.7332242225859247}, 'f1': {'supports': 0.876117496807152, 'contradicts': 0.5426829268292682, 'parts_of_same': 0.6989079563182528}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8089210367691381, 'recall': 0.8089210367691381, 'f1': 0.8089210367691381, 'support': None}, 'macro_avg': {'precision': 0.6936565644970489, 'recall': 0.720037187062544, 'f1': 0.7059027933182244, 'support': None}, 'weighted_avg': {'precision': 0.8161354289156384, 'recall': 0.8089210367691381, 'f1': 0.8119301899319944, 'support': None}}
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.8878048780487805, 'contradicts': 0.660377358490566, 'parts_of_same': 0.7244582043343654}, 'recall': {'supports': 0.9126619306310071, 'contradicts': 0.445859872611465, 'parts_of_same': 0.7659574468085106}, 'f1': {'supports': 0.9000618174325159, 'contradicts': 0.532319391634981, 'parts_of_same': 0.7446300715990453}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8414707655213984, 'recall': 0.8414707655213984, 'f1': 0.8414707655213984, 'support': None}, 'macro_avg': {'precision': 0.7575468136245705, 'recall': 0.7081597500169942, 'f1': 0.7256704268888474, 'support': None}, 'weighted_avg': {'precision': 0.8362023889647578, 'recall': 0.8414707655213984, 'f1': 0.8366380927777007, 'support': None}}
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9034188034188034, 'contradicts': 0.5488505747126436, 'parts_of_same': 0.7111111111111111}, 'recall': {'supports': 0.8834099456748851, 'contradicts': 0.60828025477707, 'parts_of_same': 0.7332242225859247}, 'f1': {'supports': 0.89330234523558, 'contradicts': 0.5770392749244713, 'parts_of_same': 0.7219983883964544}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8297166968053044, 'recall': 0.8297166968053044, 'f1': 0.8297166968053044, 'support': None}, 'macro_avg': {'precision': 0.7211268297475194, 'recall': 0.7416381410126266, 'f1': 0.7307800028521685, 'support': None}, 'weighted_avg': {'precision': 0.8344512254158697, 'recall': 0.8297166968053044, 'f1': 0.8318275647333516, 'support': None}}
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9386138613861386, 'contradicts': 0.4503464203233256, 'parts_of_same': 0.6138728323699422}, 'recall': {'supports': 0.7923109068115336, 'contradicts': 0.6210191082802548, 'parts_of_same': 0.8690671031096563}, 'f1': {'supports': 0.8592794017675052, 'contradicts': 0.5220883534136546, 'parts_of_same': 0.7195121951219512}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.7902350813743219, 'recall': 0.7902350813743219, 'f1': 0.7902350813743219, 'support': None}, 'macro_avg': {'precision': 0.6676110380264687, 'recall': 0.7607990394004815, 'f1': 0.7002933167677036, 'support': None}, 'weighted_avg': {'precision': 0.832606403513137, 'recall': 0.7902350813743219, 'f1': 0.8016314956663771, 'support': None}}
Loss: tensor(9.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9557216791259344, 'contradicts': 0.4750593824228028, 'parts_of_same': 0.49654576856649396}, 'recall': {'supports': 0.6945256999582115, 'contradicts': 0.6369426751592356, 'parts_of_same': 0.9410801963993454}, 'f1': {'supports': 0.8044530493707648, 'contradicts': 0.5442176870748299, 'parts_of_same': 0.6500847936687394}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.7344786015672091, 'recall': 0.7344786015672091, 'f1': 0.7344786015672091, 'support': None}, 'macro_avg': {'precision': 0.6424422767050771, 'recall': 0.7575161905055975, 'f1': 0.6662518433714446, 'support': None}, 'weighted_avg': {'precision': 0.8256781461191226, 'recall': 0.7344786015672091, 'f1': 0.7513991289383172, 'support': None}}
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9227854097584084, 'contradicts': 0.4321223709369025, 'parts_of_same': 0.7002923976608187}, 'recall': {'supports': 0.8140409527789386, 'contradicts': 0.7197452229299363, 'parts_of_same': 0.7839607201309329}, 'f1': {'supports': 0.8650088809946714, 'contradicts': 0.5400238948626045, 'parts_of_same': 0.7397683397683397}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.79957805907173, 'recall': 0.79957805907173, 'f1': 0.79957805907173, 'support': None}, 'macro_avg': {'precision': 0.6850667261187099, 'recall': 0.7725822986132692, 'f1': 0.7149337052085386, 'support': None}, 'weighted_avg': {'precision': 0.8353799171177875, 'recall': 0.79957805907173, 'f1': 0.8111911424971556, 'support': None}}
Loss: tensor(2.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9057569296375266, 'contradicts': 0.5562310030395137, 'parts_of_same': 0.7375776397515528}, 'recall': {'supports': 0.8875888006686168, 'contradicts': 0.5828025477707006, 'parts_of_same': 0.7774140752864157}, 'f1': {'supports': 0.8965808357956943, 'contradicts': 0.5692068429237946, 'parts_of_same': 0.7569721115537849}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.838456901748041, 'recall': 0.838456901748041, 'f1': 0.8384569017480409, 'support': None}, 'macro_avg': {'precision': 0.7331885241428644, 'recall': 0.7492684745752444, 'f1': 0.7409199300910911, 'support': None}, 'weighted_avg': {'precision': 0.8417097062884892, 'recall': 0.838456901748041, 'f1': 0.8398911539772544, 'support': None}}
Loss: tensor(0.4672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9013074652045551, 'contradicts': 0.5691823899371069, 'parts_of_same': 0.7360890302066773}, 'recall': {'supports': 0.893021312160468, 'contradicts': 0.5764331210191083, 'parts_of_same': 0.7577741407528642}, 'f1': {'supports': 0.8971452560873215, 'contradicts': 0.5727848101265822, 'parts_of_same': 0.7467741935483871}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8381555153707052, 'recall': 0.8381555153707052, 'f1': 0.8381555153707052, 'support': None}, 'macro_avg': {'precision': 0.7355262951161131, 'recall': 0.7424095246441468, 'f1': 0.7389014199207636, 'support': None}, 'weighted_avg': {'precision': 0.8394522098044097, 'recall': 0.8381555153707052, 'f1': 0.838758909118376, 'support': None}}
Loss: tensor(5.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.8936082474226804, 'contradicts': 0.5644699140401146, 'parts_of_same': 0.7904411764705882}, 'recall': {'supports': 0.9055578771416631, 'contradicts': 0.6273885350318471, 'parts_of_same': 0.7037643207855974}, 'f1': {'supports': 0.8995433789954337, 'contradicts': 0.5942684766214178, 'parts_of_same': 0.7445887445887446}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8420735382760699, 'recall': 0.8420735382760699, 'f1': 0.8420735382760699, 'support': None}, 'macro_avg': {'precision': 0.7495064459777945, 'recall': 0.7455702443197025, 'f1': 0.7461335334018654, 'support': None}, 'weighted_avg': {'precision': 0.8434622205890897, 'recall': 0.8420735382760699, 'f1': 0.8421191472389756, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.8931552587646077, 'contradicts': 0.5558739255014327, 'parts_of_same': 0.7521815008726004}, 'recall': {'supports': 0.8942749686585876, 'contradicts': 0.6178343949044586, 'parts_of_same': 0.7054009819967266}, 'f1': {'supports': 0.8937147629985384, 'contradicts': 0.5852187028657617, 'parts_of_same': 0.7280405405405405}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8333333333333334, 'recall': 0.8333333333333334, 'f1': 0.8333333333333334, 'support': None}, 'macro_avg': {'precision': 0.7337368950462135, 'recall': 0.7391701151865909, 'f1': 0.7356580021349468, 'support': None}, 'weighted_avg': {'precision': 0.8352766256372256, 'recall': 0.8333333333333334, 'f1': 0.8340117151373182, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.9006211180124224, 'contradicts': 0.6081081081081081, 'parts_of_same': 0.6068883610451307}, 'recall': {'supports': 0.8483075637275387, 'contradicts': 0.4299363057324841, 'parts_of_same': 0.8363338788870703}, 'f1': {'supports': 0.8736819453410802, 'contradicts': 0.503731343283582, 'parts_of_same': 0.7033723331039229}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8065099457504521, 'recall': 0.8065099457504521, 'f1': 0.806509945750452, 'support': None}, 'macro_avg': {'precision': 0.7052058623885538, 'recall': 0.7048592494490311, 'f1': 0.6935952072428617, 'support': None}, 'weighted_avg': {'precision': 0.8188490265064037, 'recall': 0.8065099457504521, 'f1': 0.8073095336102312, 'support': None}}
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.8958422631804543, 'contradicts': 0.49709302325581395, 'parts_of_same': 0.7207488299531981}, 'recall': {'supports': 0.873380693689929, 'contradicts': 0.5445859872611465, 'parts_of_same': 0.7561374795417348}, 'f1': {'supports': 0.8844688954718578, 'contradicts': 0.5197568389057751, 'parts_of_same': 0.7380191693290735}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.820675105485232, 'recall': 0.820675105485232, 'f1': 0.820675105485232, 'support': None}, 'macro_avg': {'precision': 0.7045613721298221, 'recall': 0.7247013868309367, 'f1': 0.7140816345689021, 'support': None}, 'weighted_avg': {'precision': 0.8258635564178893, 'recall': 0.820675105485232, 'f1': 0.8229859634540786, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.8934935764608372, 'contradicts': 0.5656934306569343, 'parts_of_same': 0.7353407290015848}, 'recall': {'supports': 0.9009611366485583, 'contradicts': 0.49363057324840764, 'parts_of_same': 0.7594108019639935}, 'f1': {'supports': 0.8972118185601331, 'contradicts': 0.5272108843537415, 'parts_of_same': 0.747181964573269}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8363471971066908, 'recall': 0.8363471971066908, 'f1': 0.8363471971066908, 'support': None}, 'macro_avg': {'precision': 0.7315092453731188, 'recall': 0.7180008372869864, 'f1': 0.7238682224957146, 'support': None}, 'weighted_avg': {'precision': 0.8333487194445537, 'recall': 0.8363471971066908, 'f1': 0.8345691018251177, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.8866612111292962, 'contradicts': 0.5512367491166078, 'parts_of_same': 0.754653130287648}, 'recall': {'supports': 0.9055578771416631, 'contradicts': 0.4968152866242038, 'parts_of_same': 0.7299509001636661}, 'f1': {'supports': 0.8960099235063056, 'contradicts': 0.5226130653266331, 'parts_of_same': 0.7420965058236273}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8345388788426763, 'recall': 0.8345388788426763, 'f1': 0.8345388788426763, 'support': None}, 'macro_avg': {'precision': 0.730850363511184, 'recall': 0.7107746879765111, 'f1': 0.7202398315521886, 'support': None}, 'weighted_avg': {'precision': 0.8306093068296484, 'recall': 0.8345388788426763, 'f1': 0.8323306855097614, 'support': None}}
Loss: tensor(7.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.8918358889349358, 'contradicts': 0.5501730103806228, 'parts_of_same': 0.7418831168831169}, 'recall': {'supports': 0.8992895946510656, 'contradicts': 0.5063694267515924, 'parts_of_same': 0.7479541734860884}, 'f1': {'supports': 0.8955472326258843, 'contradicts': 0.527363184079602, 'parts_of_same': 0.7449062754686228}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8342374924653405, 'recall': 0.8342374924653405, 'f1': 0.8342374924653405, 'support': None}, 'macro_avg': {'precision': 0.7279640053995585, 'recall': 0.7178710649629153, 'f1': 0.7226055640580364, 'support': None}, 'weighted_avg': {'precision': 0.8318891476481016, 'recall': 0.8342374924653405, 'f1': 0.8329639245889284, 'support': None}}
Loss: tensor(5.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.8921609290750726, 'contradicts': 0.5501730103806228, 'parts_of_same': 0.7411003236245954}, 'recall': {'supports': 0.8988717091516925, 'contradicts': 0.5063694267515924, 'parts_of_same': 0.7495908346972177}, 'f1': {'supports': 0.8955037468776019, 'contradicts': 0.527363184079602, 'parts_of_same': 0.7453213995117982}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8342374924653405, 'recall': 0.8342374924653405, 'f1': 0.8342374924653405, 'support': None}, 'macro_avg': {'precision': 0.7278114210267637, 'recall': 0.7182773235335008, 'f1': 0.7227294434896674, 'support': None}, 'weighted_avg': {'precision': 0.8319794232280869, 'recall': 0.8342374924653405, 'f1': 0.8330090057808331, 'support': None}}
Loss: tensor(2.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.8929016189290162, 'contradicts': 0.5517241379310345, 'parts_of_same': 0.7399030694668821}, 'recall': {'supports': 0.8988717091516925, 'contradicts': 0.5095541401273885, 'parts_of_same': 0.7495908346972177}, 'f1': {'supports': 0.8958767180341525, 'contradicts': 0.5298013245033112, 'parts_of_same': 0.7447154471544716}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8345388788426763, 'recall': 0.8345388788426763, 'f1': 0.8345388788426763, 'support': None}, 'macro_avg': {'precision': 0.728176275442311, 'recall': 0.7193388946587662, 'f1': 0.7234644965639784, 'support': None}, 'weighted_avg': {'precision': 0.83243994239052, 'recall': 0.8345388788426763, 'f1': 0.8333971489937158, 'support': None}}
Loss: tensor(8.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.8928126298296635, 'contradicts': 0.5498281786941581, 'parts_of_same': 0.7387096774193549}, 'recall': {'supports': 0.8980359381529461, 'contradicts': 0.5095541401273885, 'parts_of_same': 0.7495908346972177}, 'f1': {'supports': 0.8954166666666666, 'contradicts': 0.5289256198347108, 'parts_of_same': 0.7441104792851341}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8339361060880048, 'recall': 0.8339361060880048, 'f1': 0.8339361060880048, 'support': None}, 'macro_avg': {'precision': 0.7271168286477255, 'recall': 0.7190603043258507, 'f1': 0.7228175885955039, 'support': None}, 'weighted_avg': {'precision': 0.831976577515243, 'recall': 0.8339361060880048, 'f1': 0.8328710761918775, 'support': None}}
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.8928571428571429, 'contradicts': 0.5498281786941581, 'parts_of_same': 0.7415185783521809}, 'recall': {'supports': 0.8984538236523193, 'contradicts': 0.5095541401273885, 'parts_of_same': 0.7512274959083469}, 'f1': {'supports': 0.8956467402624453, 'contradicts': 0.5289256198347108, 'parts_of_same': 0.7463414634146341}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8345388788426763, 'recall': 0.8345388788426763, 'f1': 0.8345388788426763, 'support': None}, 'macro_avg': {'precision': 0.728067966634494, 'recall': 0.7197451532293515, 'f1': 0.7236379411705967, 'support': None}, 'weighted_avg': {'precision': 0.832525931989238, 'recall': 0.8345388788426763, 'f1': 0.8334478385239519, 'support': None}}
Loss: tensor(4.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.8928126298296635, 'contradicts': 0.547945205479452, 'parts_of_same': 0.7399030694668821}, 'recall': {'supports': 0.8980359381529461, 'contradicts': 0.5095541401273885, 'parts_of_same': 0.7495908346972177}, 'f1': {'supports': 0.8954166666666666, 'contradicts': 0.5280528052805281, 'parts_of_same': 0.7447154471544716}, 'support': {'supports': 2393, 'contradicts': 314, 'parts_of_same': 611}, 'micro_avg': {'precision': 0.8339361060880048, 'recall': 0.8339361060880048, 'f1': 0.8339361060880048, 'support': None}, 'macro_avg': {'precision': 0.7268869682586659, 'recall': 0.7190603043258507, 'f1': 0.7227283063672222, 'support': None}, 'weighted_avg': {'precision': 0.8320181413945743, 'recall': 0.8339361060880048, 'f1': 0.8328998801696207, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 4-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.0, 'contradicts': 0.08975217682518419, 'parts_of_same': 0.0}, 'recall': {'supports': 0.0, 'contradicts': 1.0, 'parts_of_same': 0.0}, 'f1': {'supports': 0.0, 'contradicts': 0.16472034419176398, 'parts_of_same': 0.0}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.08969210174029452, 'recall': 0.08969210174029452, 'f1': 0.08969210174029452, 'support': None}, 'macro_avg': {'precision': 0.029917392275061395, 'recall': 0.3333333333333333, 'f1': 0.05490678139725466, 'support': None}, 'weighted_avg': {'precision': 0.008050061375217323, 'recall': 0.08969210174029452, 'f1': 0.014774113869944025, 'support': None}}
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9493600445186422, 'contradicts': 0.6273764258555133, 'parts_of_same': 0.5161637931034483}, 'recall': {'supports': 0.7751022262607905, 'contradicts': 0.6156716417910447, 'parts_of_same': 0.9229287090558767}, 'f1': {'supports': 0.8534267133566784, 'contradicts': 0.6214689265536724, 'parts_of_same': 0.6620594333102973}, 'support': {'supports': 2201, 'contradicts': 268, 'parts_of_same': 519}, 'micro_avg': {'precision': 0.786479250334672, 'recall': 0.786479250334672, 'f1': 0.786479250334672, 'support': None}, 'macro_avg': {'precision': 0.6976334211592014, 'recall': 0.7712341923692373, 'f1': 0.712318357740216, 'support': None}, 'weighted_avg': {'precision': 0.8452367298311576, 'recall': 0.786479250334672, 'f1': 0.7993824345055146, 'support': None}}
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9565217391304348, 'contradicts': 0.4215885947046843, 'parts_of_same': 0.6586059743954481}, 'recall': {'supports': 0.78, 'contradicts': 0.7723880597014925, 'parts_of_same': 0.8903846153846153}, 'f1': {'supports': 0.8592889334001002, 'contradicts': 0.5454545454545454, 'parts_of_same': 0.7571545380212592}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.7985274431057564, 'recall': 0.7985274431057564, 'f1': 0.7985274431057564, 'support': None}, 'macro_avg': {'precision': 0.6789054360768557, 'recall': 0.8142575583620358, 'f1': 0.7206326722919684, 'support': None}, 'weighted_avg': {'precision': 0.8566963440941916, 'recall': 0.7985274431057564, 'f1': 0.813366074776805, 'support': None}}
Loss: tensor(1.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9479553903345725, 'contradicts': 0.6116838487972509, 'parts_of_same': 0.5773955773955773}, 'recall': {'supports': 0.8113636363636364, 'contradicts': 0.664179104477612, 'parts_of_same': 0.9038461538461539}, 'f1': {'supports': 0.8743570903747244, 'contradicts': 0.6368515205724509, 'parts_of_same': 0.704647676161919}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8142570281124498, 'recall': 0.8142570281124498, 'f1': 0.8142570281124497, 'support': None}, 'macro_avg': {'precision': 0.7123449388424669, 'recall': 0.7931296315624673, 'f1': 0.7386187623696981, 'support': None}, 'weighted_avg': {'precision': 0.8533061681591109, 'recall': 0.8142570281124498, 'f1': 0.8235202804357458, 'support': None}}
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.9343459088682019, 'contradicts': 0.5195530726256983, 'parts_of_same': 0.7249575551782682}, 'recall': {'supports': 0.8668181818181818, 'contradicts': 0.6940298507462687, 'parts_of_same': 0.8211538461538461}, 'f1': {'supports': 0.8993161990096675, 'contradicts': 0.5942492012779552, 'parts_of_same': 0.7700631199278629}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8433734939759037, 'recall': 0.8433734939759037, 'f1': 0.8433734939759037, 'support': None}, 'macro_avg': {'precision': 0.726285512224056, 'recall': 0.7940006262394322, 'f1': 0.7545428400718285, 'support': None}, 'weighted_avg': {'precision': 0.8607025273314695, 'recall': 0.8433734939759037, 'f1': 0.8494602564010205, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.9192253188474256, 'contradicts': 0.5403899721448467, 'parts_of_same': 0.748046875}, 'recall': {'supports': 0.8845454545454545, 'contradicts': 0.7238805970149254, 'parts_of_same': 0.7365384615384616}, 'f1': {'supports': 0.9015520037062776, 'contradicts': 0.6188197767145136, 'parts_of_same': 0.7422480620155039}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8443775100401606, 'recall': 0.8443775100401606, 'f1': 0.8443775100401606, 'support': None}, 'macro_avg': {'precision': 0.7358873886640908, 'recall': 0.7816548376996139, 'f1': 0.7542066141454317, 'support': None}, 'weighted_avg': {'precision': 0.8554566897587533, 'recall': 0.8443775100401606, 'f1': 0.8484695785011254, 'support': None}}
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9257473481195757, 'contradicts': 0.4888888888888889, 'parts_of_same': 0.7779960707269156}, 'recall': {'supports': 0.8727272727272727, 'contradicts': 0.7388059701492538, 'parts_of_same': 0.7615384615384615}, 'f1': {'supports': 0.898455779129621, 'contradicts': 0.5884101040118871, 'parts_of_same': 0.7696793002915453}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8413654618473896, 'recall': 0.8413654618473896, 'f1': 0.8413654618473895, 'support': None}, 'macro_avg': {'precision': 0.7308774359117933, 'recall': 0.7910239014716627, 'f1': 0.7521817278110179, 'support': None}, 'weighted_avg': {'precision': 0.8608515210385826, 'recall': 0.8413654618473896, 'f1': 0.8482362309611633, 'support': None}}
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9112397491558129, 'contradicts': 0.43466666666666665, 'parts_of_same': 0.7685185185185185}, 'recall': {'supports': 0.8586363636363636, 'contradicts': 0.6082089552238806, 'parts_of_same': 0.7980769230769231}, 'f1': {'supports': 0.8841563304469927, 'contradicts': 0.5069984447900466, 'parts_of_same': 0.7830188679245284}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8256358768406962, 'recall': 0.8256358768406962, 'f1': 0.8256358768406962, 'support': None}, 'macro_avg': {'precision': 0.7048083114469993, 'recall': 0.7549740806457225, 'f1': 0.7247245477205225, 'support': None}, 'weighted_avg': {'precision': 0.8436572103209788, 'recall': 0.8256358768406962, 'f1': 0.8327273499022328, 'support': None}}
Loss: tensor(0.4228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.9188326493388053, 'contradicts': 0.6203007518796992, 'parts_of_same': 0.775047258979206}, 'recall': {'supports': 0.9159090909090909, 'contradicts': 0.6156716417910447, 'parts_of_same': 0.7884615384615384}, 'f1': {'supports': 0.9173685408604599, 'contradicts': 0.6179775280898877, 'parts_of_same': 0.7816968541468065}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8668005354752343, 'recall': 0.8668005354752343, 'f1': 0.8668005354752343, 'support': None}, 'macro_avg': {'precision': 0.7713935533992369, 'recall': 0.773347423720558, 'f1': 0.7723476410323847, 'support': None}, 'weighted_avg': {'precision': 0.8670338034532524, 'recall': 0.8668005354752343, 'f1': 0.8669046625091839, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9377289377289377, 'contradicts': 0.413135593220339, 'parts_of_same': 0.7173553719008264}, 'recall': {'supports': 0.8145454545454546, 'contradicts': 0.7276119402985075, 'parts_of_same': 0.8346153846153846}, 'f1': {'supports': 0.8718073461444903, 'contradicts': 0.527027027027027, 'parts_of_same': 0.7715555555555556}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8102409638554217, 'recall': 0.8102409638554217, 'f1': 0.8102409638554217, 'support': None}, 'macro_avg': {'precision': 0.6894066342833677, 'recall': 0.7922575931531156, 'f1': 0.7234633095756909, 'support': None}, 'weighted_avg': {'precision': 0.8523255673946264, 'recall': 0.8102409638554217, 'f1': 0.8234365105923731, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9340712223291626, 'contradicts': 0.6013986013986014, 'parts_of_same': 0.7131410256410257}, 'recall': {'supports': 0.8818718764198091, 'contradicts': 0.6417910447761194, 'parts_of_same': 0.8574181117533719}, 'f1': {'supports': 0.9072213133909791, 'contradicts': 0.6209386281588447, 'parts_of_same': 0.7786526684164481}, 'support': {'supports': 2201, 'contradicts': 268, 'parts_of_same': 519}, 'micro_avg': {'precision': 0.856091030789826, 'recall': 0.856091030789826, 'f1': 0.8560910307898261, 'support': None}, 'macro_avg': {'precision': 0.7495369497895966, 'recall': 0.7936936776497667, 'f1': 0.768937536655424, 'support': None}, 'weighted_avg': {'precision': 0.8658586940525449, 'recall': 0.856091030789826, 'f1': 0.8592123152704992, 'support': None}}
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9191588785046729, 'contradicts': 0.5377643504531722, 'parts_of_same': 0.7659574468085106}, 'recall': {'supports': 0.894090909090909, 'contradicts': 0.664179104477612, 'parts_of_same': 0.7615384615384615}, 'f1': {'supports': 0.9064516129032258, 'contradicts': 0.5943238731218697, 'parts_of_same': 0.76374156219865}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8504016064257028, 'recall': 0.8504016064257028, 'f1': 0.8504016064257028, 'support': None}, 'macro_avg': {'precision': 0.7409602252554519, 'recall': 0.7732694917023274, 'f1': 0.7548390160745818, 'support': None}, 'weighted_avg': {'precision': 0.8582892406198649, 'recall': 0.8504016064257028, 'f1': 0.8536204681148113, 'support': None}}
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9256661991584852, 'contradicts': 0.5523809523809524, 'parts_of_same': 0.7940074906367042}, 'recall': {'supports': 0.8995910949568378, 'contradicts': 0.6492537313432836, 'parts_of_same': 0.8169556840077071}, 'f1': {'supports': 0.912442396313364, 'contradicts': 0.5969125214408234, 'parts_of_same': 0.805318138651472}, 'support': {'supports': 2201, 'contradicts': 268, 'parts_of_same': 519}, 'micro_avg': {'precision': 0.8627844712182061, 'recall': 0.8627844712182061, 'f1': 0.862784471218206, 'support': None}, 'macro_avg': {'precision': 0.7573515473920472, 'recall': 0.7886001701026095, 'f1': 0.7715576854685531, 'support': None}, 'weighted_avg': {'precision': 0.8693170305309138, 'recall': 0.8627844712182061, 'f1': 0.865534934401596, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9259606373008434, 'contradicts': 0.5676567656765676, 'parts_of_same': 0.778584392014519}, 'recall': {'supports': 0.8981818181818182, 'contradicts': 0.6417910447761194, 'parts_of_same': 0.825}, 'f1': {'supports': 0.9118597138901707, 'contradicts': 0.6024518388791593, 'parts_of_same': 0.8011204481792716}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8624497991967871, 'recall': 0.8624497991967871, 'f1': 0.862449799196787, 'support': None}, 'macro_avg': {'precision': 0.7574005983306433, 'recall': 0.788324287652646, 'f1': 0.7718106669828672, 'support': None}, 'weighted_avg': {'precision': 0.8681758029152362, 'recall': 0.8624497991967871, 'f1': 0.8648363776543546, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9267605633802817, 'contradicts': 0.5676567656765676, 'parts_of_same': 0.7765765765765765}, 'recall': {'supports': 0.8972727272727272, 'contradicts': 0.6417910447761194, 'parts_of_same': 0.8288461538461539}, 'f1': {'supports': 0.9117782909930716, 'contradicts': 0.6024518388791593, 'parts_of_same': 0.8018604651162791}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8624497991967871, 'recall': 0.8624497991967871, 'f1': 0.862449799196787, 'support': None}, 'macro_avg': {'precision': 0.7569979685444753, 'recall': 0.7893033086316669, 'f1': 0.7720301983295034, 'support': None}, 'weighted_avg': {'precision': 0.8684153522281659, 'recall': 0.8624497991967871, 'f1': 0.8649052124714985, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9271616541353384, 'contradicts': 0.5714285714285714, 'parts_of_same': 0.7728085867620751}, 'recall': {'supports': 0.8968181818181818, 'contradicts': 0.6417910447761194, 'parts_of_same': 0.8307692307692308}, 'f1': {'supports': 0.9117375231053604, 'contradicts': 0.6045694200351494, 'parts_of_same': 0.8007414272474515}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8624497991967871, 'recall': 0.8624497991967871, 'f1': 0.862449799196787, 'support': None}, 'macro_avg': {'precision': 0.757132937441995, 'recall': 0.7897928191211774, 'f1': 0.7723494567959871, 'support': None}, 'weighted_avg': {'precision': 0.8683932266923965, 'recall': 0.8624497991967871, 'f1': 0.8648703807128139, 'support': None}}
Loss: tensor(9.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9271616541353384, 'contradicts': 0.5714285714285714, 'parts_of_same': 0.7728085867620751}, 'recall': {'supports': 0.8968181818181818, 'contradicts': 0.6417910447761194, 'parts_of_same': 0.8307692307692308}, 'f1': {'supports': 0.9117375231053604, 'contradicts': 0.6045694200351494, 'parts_of_same': 0.8007414272474515}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8624497991967871, 'recall': 0.8624497991967871, 'f1': 0.862449799196787, 'support': None}, 'macro_avg': {'precision': 0.757132937441995, 'recall': 0.7897928191211774, 'f1': 0.7723494567959871, 'support': None}, 'weighted_avg': {'precision': 0.8683932266923965, 'recall': 0.8624497991967871, 'f1': 0.8648703807128139, 'support': None}}
Loss: tensor(6.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9272300469483568, 'contradicts': 0.57, 'parts_of_same': 0.7741935483870968}, 'recall': {'supports': 0.8973194002726034, 'contradicts': 0.6404494382022472, 'parts_of_same': 0.8307692307692308}, 'f1': {'supports': 0.912029554375433, 'contradicts': 0.6031746031746033, 'parts_of_same': 0.8014842300556586}, 'support': {'supports': 2201, 'contradicts': 267, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8627844712182061, 'recall': 0.8627844712182061, 'f1': 0.862784471218206, 'support': None}, 'macro_avg': {'precision': 0.7571411984451512, 'recall': 0.7895126897480272, 'f1': 0.7722294625352317, 'support': None}, 'weighted_avg': {'precision': 0.8686760302860185, 'recall': 0.8627844712182061, 'f1': 0.8651929276629484, 'support': None}}
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.9272641952135148, 'contradicts': 0.5752508361204013, 'parts_of_same': 0.7741935483870968}, 'recall': {'supports': 0.8981818181818182, 'contradicts': 0.6417910447761194, 'parts_of_same': 0.8307692307692308}, 'f1': {'supports': 0.9124913414915724, 'contradicts': 0.6067019400352733, 'parts_of_same': 0.8014842300556586}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8634538152610441, 'recall': 0.8634538152610441, 'f1': 0.8634538152610441, 'support': None}, 'macro_avg': {'precision': 0.7589028599070042, 'recall': 0.7902473645757229, 'f1': 0.7735591705275014, 'support': None}, 'weighted_avg': {'precision': 0.8690525765432698, 'recall': 0.8634538152610441, 'f1': 0.8657459407094561, 'support': None}}
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.927665570690465, 'contradicts': 0.5752508361204013, 'parts_of_same': 0.7732142857142857}, 'recall': {'supports': 0.8977272727272727, 'contradicts': 0.6417910447761194, 'parts_of_same': 0.8326923076923077}, 'f1': {'supports': 0.9124509124509124, 'contradicts': 0.6067019400352733, 'parts_of_same': 0.8018518518518519}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8634538152610441, 'recall': 0.8634538152610441, 'f1': 0.8634538152610441, 'support': None}, 'macro_avg': {'precision': 0.7587102308417174, 'recall': 0.7907368750652334, 'f1': 0.7736682347793459, 'support': None}, 'weighted_avg': {'precision': 0.8691776801106823, 'recall': 0.8634538152610441, 'f1': 0.8657801506975983, 'support': None}}
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.9272983114446529, 'contradicts': 0.5791245791245792, 'parts_of_same': 0.7728085867620751}, 'recall': {'supports': 0.8986363636363637, 'contradicts': 0.6417910447761194, 'parts_of_same': 0.8307692307692308}, 'f1': {'supports': 0.9127423822714682, 'contradicts': 0.6088495575221239, 'parts_of_same': 0.8007414272474515}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8637884872824632, 'recall': 0.8637884872824632, 'f1': 0.863788487282463, 'support': None}, 'macro_avg': {'precision': 0.7597438257771024, 'recall': 0.790398879727238, 'f1': 0.7741111223470146, 'support': None}, 'weighted_avg': {'precision': 0.8691841156291509, 'recall': 0.8637884872824632, 'f1': 0.865994131386156, 'support': None}}
Loss: tensor(9.1455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.9269320843091335, 'contradicts': 0.5777027027027027, 'parts_of_same': 0.7755834829443446}, 'recall': {'supports': 0.8995454545454545, 'contradicts': 0.6380597014925373, 'parts_of_same': 0.8307692307692308}, 'f1': {'supports': 0.913033448673587, 'contradicts': 0.6063829787234043, 'parts_of_same': 0.8022284122562673}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8641231593038822, 'recall': 0.8641231593038822, 'f1': 0.8641231593038822, 'support': None}, 'macro_avg': {'precision': 0.7600727566520603, 'recall': 0.789458128935741, 'f1': 0.7738816132177528, 'support': None}, 'weighted_avg': {'precision': 0.8692698530573886, 'recall': 0.8641231593038822, 'f1': 0.8662459838530867, 'support': None}}
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.9269662921348315, 'contradicts': 0.5796610169491525, 'parts_of_same': 0.7755834829443446}, 'recall': {'supports': 0.9, 'contradicts': 0.6380597014925373, 'parts_of_same': 0.8307692307692308}, 'f1': {'supports': 0.9132841328413285, 'contradicts': 0.6074600355239786, 'parts_of_same': 0.8022284122562673}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8644578313253012, 'recall': 0.8644578313253012, 'f1': 0.8644578313253012, 'support': None}, 'macro_avg': {'precision': 0.7607369306761096, 'recall': 0.7896096440872561, 'f1': 0.7743241935405248, 'support': None}, 'weighted_avg': {'precision': 0.8694706848628051, 'recall': 0.8644578313253012, 'f1': 0.8665271606909665, 'support': None}}
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.9270004679457183, 'contradicts': 0.5796610169491525, 'parts_of_same': 0.7751798561151079}, 'recall': {'supports': 0.9000454338936847, 'contradicts': 0.6380597014925373, 'parts_of_same': 0.8304431599229287}, 'f1': {'supports': 0.9133241124942371, 'contradicts': 0.6074600355239786, 'parts_of_same': 0.801860465116279}, 'support': {'supports': 2201, 'contradicts': 268, 'parts_of_same': 519}, 'micro_avg': {'precision': 0.8644578313253012, 'recall': 0.8644578313253012, 'f1': 0.8644578313253012, 'support': None}, 'macro_avg': {'precision': 0.7606137803366595, 'recall': 0.7895160984363837, 'f1': 0.7742148710448316, 'support': None}, 'weighted_avg': {'precision': 0.8694764149312719, 'recall': 0.8644578313253012, 'f1': 0.8665298669730894, 'support': None}}
Loss: tensor(3.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.9265668849391955, 'contradicts': 0.5816326530612245, 'parts_of_same': 0.7751798561151079}, 'recall': {'supports': 0.9004545454545455, 'contradicts': 0.6380597014925373, 'parts_of_same': 0.8288461538461539}, 'f1': {'supports': 0.9133241124942371, 'contradicts': 0.608540925266904, 'parts_of_same': 0.8011152416356877}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8644578313253012, 'recall': 0.8644578313253012, 'f1': 0.8644578313253012, 'support': None}, 'macro_avg': {'precision': 0.761126464705176, 'recall': 0.7891201335977457, 'f1': 0.7743267597989428, 'support': None}, 'weighted_avg': {'precision': 0.869283207184235, 'recall': 0.8644578313253012, 'f1': 0.8664598196483966, 'support': None}}
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.9265325222274217, 'contradicts': 0.5816326530612245, 'parts_of_same': 0.7737881508078994}, 'recall': {'supports': 0.9, 'contradicts': 0.6380597014925373, 'parts_of_same': 0.8288461538461539}, 'f1': {'supports': 0.913073553147337, 'contradicts': 0.608540925266904, 'parts_of_same': 0.8003714020427113}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8641231593038822, 'recall': 0.8641231593038822, 'f1': 0.8641231593038822, 'support': None}, 'macro_avg': {'precision': 0.7606511086988487, 'recall': 0.7889686184462305, 'f1': 0.7739952934856508, 'support': None}, 'weighted_avg': {'precision': 0.8690157089494122, 'recall': 0.8641231593038822, 'f1': 0.8661458882054488, 'support': None}}
Loss: tensor(1.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.9265325222274217, 'contradicts': 0.5816326530612245, 'parts_of_same': 0.7737881508078994}, 'recall': {'supports': 0.9, 'contradicts': 0.6380597014925373, 'parts_of_same': 0.8288461538461539}, 'f1': {'supports': 0.913073553147337, 'contradicts': 0.608540925266904, 'parts_of_same': 0.8003714020427113}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8641231593038822, 'recall': 0.8641231593038822, 'f1': 0.8641231593038822, 'support': None}, 'macro_avg': {'precision': 0.7606511086988487, 'recall': 0.7889686184462305, 'f1': 0.7739952934856508, 'support': None}, 'weighted_avg': {'precision': 0.8690157089494122, 'recall': 0.8641231593038822, 'f1': 0.8661458882054488, 'support': None}}
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.9264981273408239, 'contradicts': 0.5816326530612245, 'parts_of_same': 0.7724014336917563}, 'recall': {'supports': 0.8995454545454545, 'contradicts': 0.6380597014925373, 'parts_of_same': 0.8288461538461539}, 'f1': {'supports': 0.9128228782287822, 'contradicts': 0.608540925266904, 'parts_of_same': 0.7996289424860853}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8637884872824632, 'recall': 0.8637884872824632, 'f1': 0.863788487282463, 'support': None}, 'macro_avg': {'precision': 0.7601774046979348, 'recall': 0.7888171032947153, 'f1': 0.7736642486605905, 'support': None}, 'weighted_avg': {'precision': 0.8687490551171132, 'recall': 0.8637884872824632, 'f1': 0.8658321118365513, 'support': None}}
Loss: tensor(8.9635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9269320843091335, 'contradicts': 0.5836177474402731, 'parts_of_same': 0.7714285714285715}, 'recall': {'supports': 0.8995454545454545, 'contradicts': 0.6380597014925373, 'parts_of_same': 0.8307692307692308}, 'f1': {'supports': 0.913033448673587, 'contradicts': 0.609625668449198, 'parts_of_same': 0.8}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8641231593038822, 'recall': 0.8641231593038822, 'f1': 0.8641231593038822, 'support': None}, 'macro_avg': {'precision': 0.7606594677259927, 'recall': 0.789458128935741, 'f1': 0.774219705707595, 'support': None}, 'weighted_avg': {'precision': 0.8690773088811727, 'recall': 0.8641231593038822, 'f1': 0.8661490181480176, 'support': None}}
Loss: tensor(8.9973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.9269320843091335, 'contradicts': 0.5836177474402731, 'parts_of_same': 0.7714285714285715}, 'recall': {'supports': 0.8995454545454545, 'contradicts': 0.6380597014925373, 'parts_of_same': 0.8307692307692308}, 'f1': {'supports': 0.913033448673587, 'contradicts': 0.609625668449198, 'parts_of_same': 0.8}, 'support': {'supports': 2200, 'contradicts': 268, 'parts_of_same': 520}, 'micro_avg': {'precision': 0.8641231593038822, 'recall': 0.8641231593038822, 'f1': 0.8641231593038822, 'support': None}, 'macro_avg': {'precision': 0.7606594677259927, 'recall': 0.789458128935741, 'f1': 0.774219705707595, 'support': None}, 'weighted_avg': {'precision': 0.8690773088811727, 'recall': 0.8641231593038822, 'f1': 0.8661490181480176, 'support': None}}
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 5-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.0, 'contradicts': 0.0908781484002723, 'parts_of_same': 0.0}, 'recall': {'supports': 0.0, 'contradicts': 1.0, 'parts_of_same': 0.0}, 'f1': {'supports': 0.0, 'contradicts': 0.16661466458658347, 'parts_of_same': 0.0}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.0908781484002723, 'recall': 0.0908781484002723, 'f1': 0.0908781484002723, 'support': None}, 'macro_avg': {'precision': 0.0302927161334241, 'recall': 0.3333333333333333, 'f1': 0.055538221528861155, 'support': None}, 'weighted_avg': {'precision': 0.008258837856661913, 'recall': 0.0908781484002723, 'f1': 0.015141632213961125, 'support': None}}
Loss: tensor(1.4985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2781, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9395638629283489, 'contradicts': 0.5434173669467787, 'parts_of_same': 0.47540983606557374}, 'recall': {'supports': 0.703030303030303, 'contradicts': 0.7265917602996255, 'parts_of_same': 0.8821292775665399}, 'f1': {'supports': 0.8042666666666666, 'contradicts': 0.6217948717948718, 'parts_of_same': 0.6178428761651132}, 'support': {'supports': 2145, 'contradicts': 267, 'parts_of_same': 526}, 'micro_avg': {'precision': 0.7372362151123213, 'recall': 0.7372362151123213, 'f1': 0.7372362151123213, 'support': None}, 'macro_avg': {'precision': 0.6527970219802337, 'recall': 0.7705837802988228, 'f1': 0.6813014715422172, 'support': None}, 'weighted_avg': {'precision': 0.8204637497367564, 'recall': 0.7372362151123213, 'f1': 0.7543078909571409, 'support': None}}
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9491206030150754, 'contradicts': 0.3763779527559055, 'parts_of_same': 0.5864978902953587}, 'recall': {'supports': 0.7044289044289044, 'contradicts': 0.8984962406015038, 'parts_of_same': 0.7912713472485768}, 'f1': {'supports': 0.8086700561948087, 'contradicts': 0.5305216426193119, 'parts_of_same': 0.6736672051696285}, 'support': {'supports': 2145, 'contradicts': 266, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.737576582709326, 'recall': 0.737576582709326, 'f1': 0.737576582709326, 'support': None}, 'macro_avg': {'precision': 0.6373321486887799, 'recall': 0.7980654974263283, 'f1': 0.670952967994583, 'support': None}, 'weighted_avg': {'precision': 0.8322207682389591, 'recall': 0.737576582709326, 'f1': 0.7592711520078271, 'support': None}}
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9281267685342388, 'contradicts': 0.54858934169279, 'parts_of_same': 0.5258215962441315}, 'recall': {'supports': 0.7649253731343284, 'contradicts': 0.6554307116104869, 'parts_of_same': 0.8500948766603416}, 'f1': {'supports': 0.8386601892099207, 'contradicts': 0.597269624573379, 'parts_of_same': 0.649746192893401}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.7702518720217836, 'recall': 0.7702518720217836, 'f1': 0.7702518720217836, 'support': None}, 'macro_avg': {'precision': 0.66751256882372, 'recall': 0.7568169871350522, 'f1': 0.6952253355589001, 'support': None}, 'weighted_avg': {'precision': 0.8214721331484139, 'recall': 0.7702518720217836, 'f1': 0.782836854690941, 'support': None}}
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.9032872796569795, 'contradicts': 0.6415770609318996, 'parts_of_same': 0.6964285714285714}, 'recall': {'supports': 0.8843283582089553, 'contradicts': 0.6704119850187266, 'parts_of_same': 0.7400379506641366}, 'f1': {'supports': 0.893707282583078, 'contradicts': 0.6556776556776557, 'parts_of_same': 0.717571297148114}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8390061266167461, 'recall': 0.8390061266167461, 'f1': 0.8390061266167461, 'support': None}, 'macro_avg': {'precision': 0.7470976373391501, 'recall': 0.7649260979639395, 'f1': 0.7556520784696158, 'support': None}, 'weighted_avg': {'precision': 0.8423985228033488, 'recall': 0.8390061266167461, 'f1': 0.8404814232542918, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.9164376030786147, 'contradicts': 0.4914772727272727, 'parts_of_same': 0.5658409387222947}, 'recall': {'supports': 0.777518656716418, 'contradicts': 0.6479400749063671, 'parts_of_same': 0.8235294117647058}, 'f1': {'supports': 0.8412818571789049, 'contradicts': 0.5589660743134087, 'parts_of_same': 0.6707882534775889}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.773995915588836, 'recall': 0.773995915588836, 'f1': 0.773995915588836, 'support': None}, 'macro_avg': {'precision': 0.6579186048427274, 'recall': 0.749662714462497, 'f1': 0.6903453949899676, 'support': None}, 'weighted_avg': {'precision': 0.8149301659378424, 'recall': 0.773995915588836, 'f1': 0.78504344901836, 'support': None}}
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9095643939393939, 'contradicts': 0.72, 'parts_of_same': 0.7060702875399361}, 'recall': {'supports': 0.8955710955710956, 'contradicts': 0.5413533834586466, 'parts_of_same': 0.8387096774193549}, 'f1': {'supports': 0.90251350716467, 'contradicts': 0.6180257510729614, 'parts_of_same': 0.766695576756288}, 'support': {'supports': 2145, 'contradicts': 266, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8533015656909462, 'recall': 0.8533015656909462, 'f1': 0.8533015656909462, 'support': None}, 'macro_avg': {'precision': 0.7785448938264432, 'recall': 0.7585447188163656, 'f1': 0.7624116116646399, 'support': None}, 'weighted_avg': {'precision': 0.855900158792902, 'recall': 0.8533015656909462, 'f1': 0.8523944491505067, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9298561151079137, 'contradicts': 0.36869565217391304, 'parts_of_same': 0.6100719424460431}, 'recall': {'supports': 0.7230769230769231, 'contradicts': 0.7940074906367042, 'parts_of_same': 0.8060836501901141}, 'f1': {'supports': 0.8135326514555469, 'contradicts': 0.503562945368171, 'parts_of_same': 0.6945126945126945}, 'support': {'supports': 2145, 'contradicts': 267, 'parts_of_same': 526}, 'micro_avg': {'precision': 0.7443839346494214, 'recall': 0.7443839346494214, 'f1': 0.7443839346494214, 'support': None}, 'macro_avg': {'precision': 0.6362079032426232, 'recall': 0.7743893546345805, 'f1': 0.6705360971121376, 'support': None}, 'weighted_avg': {'precision': 0.8216068576458573, 'recall': 0.7443839346494214, 'f1': 0.7640546361807784, 'support': None}}
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.9206670035371399, 'contradicts': 0.5776173285198556, 'parts_of_same': 0.6524926686217009}, 'recall': {'supports': 0.8494172494172494, 'contradicts': 0.599250936329588, 'parts_of_same': 0.8460076045627376}, 'f1': {'supports': 0.8836081474296799, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.7367549668874172}, 'support': {'supports': 2145, 'contradicts': 267, 'parts_of_same': 526}, 'micro_avg': {'precision': 0.826072157930565, 'recall': 0.826072157930565, 'f1': 0.826072157930565, 'support': None}, 'macro_avg': {'precision': 0.7169256668928988, 'recall': 0.7648919301031917, 'f1': 0.736199469478248, 'support': None}, 'weighted_avg': {'precision': 0.841479133082703, 'recall': 0.826072157930565, 'f1': 0.8304735916776231, 'support': None}}
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.8793026374608851, 'contradicts': 0.5924528301886792, 'parts_of_same': 0.7981651376146789}, 'recall': {'supports': 0.9174440298507462, 'contradicts': 0.5880149812734082, 'parts_of_same': 0.6603415559772297}, 'f1': {'supports': 0.8979685003423875, 'contradicts': 0.5902255639097744, 'parts_of_same': 0.7227414330218068}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8413886997957795, 'recall': 0.8413886997957795, 'f1': 0.8413886997957793, 'support': None}, 'macro_avg': {'precision': 0.7566402017547477, 'recall': 0.7219335223671282, 'f1': 0.736978499091323, 'support': None}, 'weighted_avg': {'precision': 0.8386803226342583, 'recall': 0.8413886997957795, 'f1': 0.8385702605515591, 'support': None}}
Loss: tensor(4.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.8762886597938144, 'contradicts': 0.5518518518518518, 'parts_of_same': 0.7871853546910755}, 'recall': {'supports': 0.9118470149253731, 'contradicts': 0.5580524344569289, 'parts_of_same': 0.6527514231499051}, 'f1': {'supports': 0.8937142857142856, 'contradicts': 0.5549348230912478, 'parts_of_same': 0.7136929460580913}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8332198774676651, 'recall': 0.8332198774676651, 'f1': 0.8332198774676651, 'support': None}, 'macro_avg': {'precision': 0.7384419554455807, 'recall': 0.7075502908440691, 'f1': 0.7207806849545415, 'support': None}, 'weighted_avg': {'precision': 0.8308216517918922, 'recall': 0.8332198774676651, 'f1': 0.8306355374096003, 'support': None}}
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5089, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9, 'contradicts': 0.5975609756097561, 'parts_of_same': 0.6877076411960132}, 'recall': {'supports': 0.8773320895522388, 'contradicts': 0.550561797752809, 'parts_of_same': 0.7855787476280834}, 'f1': {'supports': 0.8885214926783184, 'contradicts': 0.5730994152046784, 'parts_of_same': 0.7333923826395038}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8311776718856365, 'recall': 0.8311776718856365, 'f1': 0.8311776718856365, 'support': None}, 'macro_avg': {'precision': 0.7284228722685898, 'recall': 0.7378242116443771, 'f1': 0.7316710968408335, 'support': None}, 'weighted_avg': {'precision': 0.834435230564365, 'recall': 0.8311776718856365, 'f1': 0.8320304322031934, 'support': None}}
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9148827726809379, 'contradicts': 0.5141242937853108, 'parts_of_same': 0.6704180064308681}, 'recall': {'supports': 0.8372201492537313, 'contradicts': 0.6816479400749064, 'parts_of_same': 0.7912713472485768}, 'f1': {'supports': 0.8743302484169508, 'contradicts': 0.5861513687600644, 'parts_of_same': 0.7258485639686683}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8148400272294077, 'recall': 0.8148400272294077, 'f1': 0.8148400272294077, 'support': None}, 'macro_avg': {'precision': 0.6998083576323723, 'recall': 0.7700464788590716, 'f1': 0.7287767270485611, 'support': None}, 'weighted_avg': {'precision': 0.8346120287466563, 'recall': 0.8148400272294077, 'f1': 0.8215073727965854, 'support': None}}
Loss: tensor(0.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.8968588842006564, 'contradicts': 0.5344262295081967, 'parts_of_same': 0.774}, 'recall': {'supports': 0.8922574626865671, 'contradicts': 0.6104868913857678, 'parts_of_same': 0.7343453510436433}, 'f1': {'supports': 0.8945522562543838, 'contradicts': 0.56993006993007, 'parts_of_same': 0.75365141187926}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8383253914227365, 'recall': 0.8383253914227365, 'f1': 0.8383253914227365, 'support': None}, 'macro_avg': {'precision': 0.7350950379029509, 'recall': 0.7456965683719927, 'f1': 0.7393779126879046, 'support': None}, 'weighted_avg': {'precision': 0.8418840200833547, 'recall': 0.8383253914227365, 'f1': 0.8397772839146009, 'support': None}}
Loss: tensor(9.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.8997867803837953, 'contradicts': 0.3241590214067278, 'parts_of_same': 0.7941176470588235}, 'recall': {'supports': 0.7873134328358209, 'contradicts': 0.7940074906367042, 'parts_of_same': 0.6148007590132827}, 'f1': {'supports': 0.8398009950248757, 'contradicts': 0.46036916395222577, 'parts_of_same': 0.6930481283422459}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.7569775357385977, 'recall': 0.7569775357385977, 'f1': 0.7569775357385977, 'support': None}, 'macro_avg': {'precision': 0.6726878162831156, 'recall': 0.7320405608286026, 'f1': 0.6644060957731158, 'support': None}, 'weighted_avg': {'precision': 0.8285205295638031, 'recall': 0.7569775357385977, 'f1': 0.7789953246238738, 'support': None}}
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.8868445262189513, 'contradicts': 0.5488721804511278, 'parts_of_same': 0.751004016064257}, 'recall': {'supports': 0.8992537313432836, 'contradicts': 0.5468164794007491, 'parts_of_same': 0.7096774193548387}, 'f1': {'supports': 0.8930060213061604, 'contradicts': 0.5478424015009381, 'parts_of_same': 0.7297560975609757}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8332198774676651, 'recall': 0.8332198774676651, 'f1': 0.8332198774676651, 'support': None}, 'macro_avg': {'precision': 0.728906907578112, 'recall': 0.7185825433662906, 'f1': 0.7235348401226914, 'support': None}, 'weighted_avg': {'precision': 0.8317640070999817, 'recall': 0.8332198774676651, 'f1': 0.8323554439400246, 'support': None}}
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9017153453871117, 'contradicts': 0.600896860986547, 'parts_of_same': 0.7455197132616488}, 'recall': {'supports': 0.9067599067599068, 'contradicts': 0.50187265917603, 'parts_of_same': 0.7908745247148289}, 'f1': {'supports': 0.9042305904230592, 'contradicts': 0.5469387755102042, 'parts_of_same': 0.7675276752767527}, 'support': {'supports': 2145, 'contradicts': 267, 'parts_of_same': 526}, 'micro_avg': {'precision': 0.8492171545268891, 'recall': 0.8492171545268891, 'f1': 0.8492171545268891, 'support': None}, 'macro_avg': {'precision': 0.7493773065451025, 'recall': 0.7331690302169219, 'f1': 0.7395656804033387, 'support': None}, 'weighted_avg': {'precision': 0.8464132903044214, 'recall': 0.8492171545268891, 'f1': 0.8472861901682296, 'support': None}}
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9173635022134776, 'contradicts': 0.5691056910569106, 'parts_of_same': 0.6828528072837633}, 'recall': {'supports': 0.8698694029850746, 'contradicts': 0.5243445692883895, 'parts_of_same': 0.8538899430740038}, 'f1': {'supports': 0.8929853962173809, 'contradicts': 0.5458089668615984, 'parts_of_same': 0.7588532883642495}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8356024506466985, 'recall': 0.8356024506466985, 'f1': 0.8356024506466985, 'support': None}, 'macro_avg': {'precision': 0.7231073335180506, 'recall': 0.7493679717824894, 'f1': 0.732549217147743, 'support': None}, 'weighted_avg': {'precision': 0.843649420591026, 'recall': 0.8356024506466985, 'f1': 0.8373748695064911, 'support': None}}
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.920059582919563, 'contradicts': 0.5914893617021276, 'parts_of_same': 0.6618287373004355}, 'recall': {'supports': 0.8642723880597015, 'contradicts': 0.5205992509363296, 'parts_of_same': 0.8652751423149905}, 'f1': {'supports': 0.8912938912938914, 'contradicts': 0.553784860557769, 'parts_of_same': 0.75}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8332198774676651, 'recall': 0.8332198774676651, 'f1': 0.8332198774676651, 'support': None}, 'macro_avg': {'precision': 0.7244592273073754, 'recall': 0.7500489271036739, 'f1': 0.7316929172838869, 'support': None}, 'weighted_avg': {'precision': 0.8438799012632202, 'recall': 0.8332198774676651, 'f1': 0.8352772841058635, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.9122390891840607, 'contradicts': 0.594017094017094, 'parts_of_same': 0.7315436241610739}, 'recall': {'supports': 0.8969216417910447, 'contradicts': 0.5205992509363296, 'parts_of_same': 0.8273244781783681}, 'f1': {'supports': 0.9045155221072437, 'contradicts': 0.5548902195608783, 'parts_of_same': 0.7764915405164737}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8502382573179034, 'recall': 0.8502382573179034, 'f1': 0.8502382573179034, 'support': None}, 'macro_avg': {'precision': 0.7459332691207429, 'recall': 0.7482817903019141, 'f1': 0.7452990940615319, 'support': None}, 'weighted_avg': {'precision': 0.8509076450803527, 'recall': 0.8502382573179034, 'f1': 0.8497780836871568, 'support': None}}
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.9142994703899856, 'contradicts': 0.5948275862068966, 'parts_of_same': 0.7011128775834659}, 'recall': {'supports': 0.8853146853146853, 'contradicts': 0.5168539325842697, 'parts_of_same': 0.8384030418250951}, 'f1': {'supports': 0.8995736617716721, 'contradicts': 0.5531062124248497, 'parts_of_same': 0.7636363636363636}, 'support': {'supports': 2145, 'contradicts': 267, 'parts_of_same': 526}, 'micro_avg': {'precision': 0.8434309053778081, 'recall': 0.8434309053778081, 'f1': 0.8434309053778081, 'support': None}, 'macro_avg': {'precision': 0.7367466447267826, 'recall': 0.7468572199080167, 'f1': 0.7387720792776284, 'support': None}, 'weighted_avg': {'precision': 0.8470989459198991, 'recall': 0.8434309053778081, 'f1': 0.8437500307999996, 'support': None}}
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.9143819143819144, 'contradicts': 0.5930735930735931, 'parts_of_same': 0.7038216560509554}, 'recall': {'supports': 0.886660447761194, 'contradicts': 0.5131086142322098, 'parts_of_same': 0.8387096774193549}, 'f1': {'supports': 0.9003078380298366, 'contradicts': 0.5502008032128515, 'parts_of_same': 0.7653679653679653}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8441116405718175, 'recall': 0.8441116405718175, 'f1': 0.8441116405718175, 'support': None}, 'macro_avg': {'precision': 0.7370923878354877, 'recall': 0.746159579804253, 'f1': 0.7386255355368844, 'support': None}, 'weighted_avg': {'precision': 0.8474130314922831, 'recall': 0.8441116405718175, 'f1': 0.8442860915393869, 'support': None}}
Loss: tensor(6.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.9143819143819144, 'contradicts': 0.5930735930735931, 'parts_of_same': 0.7038216560509554}, 'recall': {'supports': 0.886660447761194, 'contradicts': 0.5131086142322098, 'parts_of_same': 0.8387096774193549}, 'f1': {'supports': 0.9003078380298366, 'contradicts': 0.5502008032128515, 'parts_of_same': 0.7653679653679653}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8441116405718175, 'recall': 0.8441116405718175, 'f1': 0.8441116405718175, 'support': None}, 'macro_avg': {'precision': 0.7370923878354877, 'recall': 0.746159579804253, 'f1': 0.7386255355368844, 'support': None}, 'weighted_avg': {'precision': 0.8474130314922831, 'recall': 0.8441116405718175, 'f1': 0.8442860915393869, 'support': None}}
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.914066250600096, 'contradicts': 0.5982532751091703, 'parts_of_same': 0.7044728434504792}, 'recall': {'supports': 0.8880597014925373, 'contradicts': 0.5131086142322098, 'parts_of_same': 0.8368121442125237}, 'f1': {'supports': 0.9008753252898036, 'contradicts': 0.5524193548387096, 'parts_of_same': 0.7649609713790112}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8447923757658271, 'recall': 0.8447923757658271, 'f1': 0.8447923757658271, 'support': None}, 'macro_avg': {'precision': 0.7389307897199151, 'recall': 0.7459934866457569, 'f1': 0.7394185505025082, 'support': None}, 'weighted_avg': {'precision': 0.847770202259754, 'recall': 0.8447923757658271, 'f1': 0.8448288281415974, 'support': None}}
Loss: tensor(3.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.9137104506232023, 'contradicts': 0.5982532751091703, 'parts_of_same': 0.7062600321027287}, 'recall': {'supports': 0.8889925373134329, 'contradicts': 0.5131086142322098, 'parts_of_same': 0.8349146110056926}, 'f1': {'supports': 0.9011820330969267, 'contradicts': 0.5524193548387096, 'parts_of_same': 0.7652173913043477}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8451327433628318, 'recall': 0.8451327433628318, 'f1': 0.8451327433628318, 'support': None}, 'macro_avg': {'precision': 0.7394079192783671, 'recall': 0.7456719208504451, 'f1': 0.7396062597466614, 'support': None}, 'weighted_avg': {'precision': 0.8478311325760491, 'recall': 0.8451327433628318, 'f1': 0.8450986425865001, 'support': None}}
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.9137104506232023, 'contradicts': 0.5982532751091703, 'parts_of_same': 0.7062600321027287}, 'recall': {'supports': 0.8889925373134329, 'contradicts': 0.5131086142322098, 'parts_of_same': 0.8349146110056926}, 'f1': {'supports': 0.9011820330969267, 'contradicts': 0.5524193548387096, 'parts_of_same': 0.7652173913043477}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8451327433628318, 'recall': 0.8451327433628318, 'f1': 0.8451327433628318, 'support': None}, 'macro_avg': {'precision': 0.7394079192783671, 'recall': 0.7456719208504451, 'f1': 0.7396062597466614, 'support': None}, 'weighted_avg': {'precision': 0.8478311325760491, 'recall': 0.8451327433628318, 'f1': 0.8450986425865001, 'support': None}}
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.9133556725706079, 'contradicts': 0.5964912280701754, 'parts_of_same': 0.7085346215780999}, 'recall': {'supports': 0.8899253731343284, 'contradicts': 0.5093632958801498, 'parts_of_same': 0.8349146110056926}, 'f1': {'supports': 0.9014883061658399, 'contradicts': 0.5494949494949495, 'parts_of_same': 0.7665505226480837}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8454731109598366, 'recall': 0.8454731109598366, 'f1': 0.8454731109598366, 'support': None}, 'macro_avg': {'precision': 0.7394605074062944, 'recall': 0.7447344266733903, 'f1': 0.7391779261029576, 'support': None}, 'weighted_avg': {'precision': 0.8478201039679302, 'recall': 0.8454731109598366, 'f1': 0.8452955089755793, 'support': None}}
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.912960306073649, 'contradicts': 0.5991189427312775, 'parts_of_same': 0.7096774193548387}, 'recall': {'supports': 0.8903917910447762, 'contradicts': 0.5093632958801498, 'parts_of_same': 0.8349146110056926}, 'f1': {'supports': 0.9015348288075561, 'contradicts': 0.5506072874493926, 'parts_of_same': 0.7672188317349607}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8458134785568414, 'recall': 0.8458134785568414, 'f1': 0.8458134785568414, 'support': None}, 'macro_avg': {'precision': 0.7405855560532549, 'recall': 0.7448898993102061, 'f1': 0.7397869826639698, 'support': None}, 'weighted_avg': {'precision': 0.8479753757423943, 'recall': 0.8458134785568414, 'f1': 0.8455504230894187, 'support': None}}
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8432e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9126491646778043, 'contradicts': 0.6017699115044248, 'parts_of_same': 0.713128038897893}, 'recall': {'supports': 0.8917910447761194, 'contradicts': 0.5093632958801498, 'parts_of_same': 0.8349146110056926}, 'f1': {'supports': 0.9020995517810806, 'contradicts': 0.5517241379310346, 'parts_of_same': 0.7692307692307693}, 'support': {'supports': 2144, 'contradicts': 267, 'parts_of_same': 527}, 'micro_avg': {'precision': 0.8468345813478557, 'recall': 0.8468345813478557, 'f1': 0.8468345813478557, 'support': None}, 'macro_avg': {'precision': 0.7425157050267074, 'recall': 0.745356317220654, 'f1': 0.7410181529809615, 'support': None}, 'weighted_avg': {'precision': 0.8486081865010495, 'recall': 0.8468345813478557, 'f1': 0.846424914646303, 'support': None}}
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.9122974261201144, 'contradicts': 0.6017699115044248, 'parts_of_same': 0.7133550488599348}, 'recall': {'supports': 0.8923076923076924, 'contradicts': 0.5093632958801498, 'parts_of_same': 0.8326996197718631}, 'f1': {'supports': 0.9021918453924112, 'contradicts': 0.5517241379310346, 'parts_of_same': 0.7684210526315789}, 'support': {'supports': 2145, 'contradicts': 267, 'parts_of_same': 526}, 'micro_avg': {'precision': 0.8468345813478557, 'recall': 0.8468345813478557, 'f1': 0.8468345813478557, 'support': None}, 'macro_avg': {'precision': 0.742474128828158, 'recall': 0.7447902026532351, 'f1': 0.7407790119850081, 'support': None}, 'weighted_avg': {'precision': 0.8484599391081187, 'recall': 0.8468345813478557, 'f1': 0.8463925550982023, 'support': None}}
Loss: tensor(7.3260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
